Implements Phase 4 (A4) - Community corpus as first-class citizens:

- **Community Corpus Builder** - Queries StemeDB pattern aggregates
- **Wiki Import** - Bootstrap corpus from markdown docs (aphoria corpus import wiki)
- **Pattern Aggregation** - Automatic learning from local scans (--sync flag)
- **Storage Layer** - StemeDBPatternStore with content-addressed deduplication
- **Promotion Logic** - Multi-tier thresholds (95%/80%/50% adoption rates)
- **Corpus Build** - Unified registry for RFC/OWASP/Vendor/Community sources
- **Trust Packs** - Export corpus as signed, distributable artifacts
- **Documentation** - bootstrap-corpus.md guide + CLI reference updates

Technical details:

- Pattern aggregates stored as assertions with predicate "pattern_aggregate"
- Content-addressed subjects via BLAKE3(subject:predicate:value)
- PatternAggregator handles write path (observations → patterns)
- StemeDBPatternStore handles read path (pattern queries)
- Integration tests + fixtures in tests/wiki_import_test.rs

Deleted hardcoded.rs (368 lines) - corpus now fully emergent from StemeDB.
Deleted enriched-corpus-patterns.md (677 lines) - feature shipped.

Closes VG-026 (community corpus), part of A4 milestone.

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
94 lines
2.0 KiB
TOML
94 lines
2.0 KiB
TOML
# Package metadata for the `aphoria` crate.
[package]
name = "aphoria"
version = "0.1.0"
authors = ["Orchard9"]
edition = "2021"
license = "MIT"
description = "A code-level truth linter powered by Episteme"

# Executable target; its entry point is src/main.rs.
[[bin]]
name = "aphoria"
path = "src/main.rs"

# Library target; its crate root is src/lib.rs. It uses the same name as the
# binary target declared in this manifest.
[lib]
name = "aphoria"
path = "src/lib.rs"

# Use workspace lints with CLI overrides.
# `workspace = true` inherits the lint configuration declared in the workspace
# root manifest.
# NOTE(review): Cargo does not accept extra per-package lint entries next to
# `workspace = true`, so the "CLI overrides" presumably live in source-level
# attributes rather than in this table — confirm.
[lints]
workspace = true

# Runtime dependencies, grouped by purpose rather than sorted alphabetically.
[dependencies]
# StemeDB dependencies (relative paths from applications/aphoria/)
stemedb-core = { path = "../../crates/stemedb-core" }
stemedb-storage = { path = "../../crates/stemedb-storage" }
stemedb-ingest = { path = "../../crates/stemedb-ingest" }
stemedb-query = { path = "../../crates/stemedb-query" }
stemedb-wal = { path = "../../crates/stemedb-wal" }
stemedb-lens = { path = "../../crates/stemedb-lens" }

# CLI
clap = { version = "4.5", features = ["derive"] }

# Async runtime
tokio = { version = "1", features = ["full"] }

# File walking
ignore = "0.4"

# Parallel extraction
rayon = "1.10"

# Pattern matching
regex = "1.10"
globset = "0.4"

# Serialization
serde = { version = "1.0", features = ["derive"] }
serde_json = "1.0"
# NOTE(review): serde_yaml appears to be marked deprecated upstream — confirm
# and consider a maintained alternative.
serde_yaml = "0.9"
toml = "0.8"

# Output formatting
comfy-table = "7.1"

# Cryptography
ed25519-dalek = { version = "2.1", features = ["rand_core"] }
blake3 = "1.5"
rand = "0.8"
hex = "0.4"

# Error handling
thiserror = "1.0"

# Platform directories
dirs = "5.0"

# Logging
tracing = "0.1"
tracing-subscriber = { version = "0.3", features = ["env-filter"] }

# rkyv for zero-copy (consistent with stemedb)
# NOTE(review): bytecheck is presumably pinned to match rkyv's "validation"
# feature — keep the two versions in step when upgrading.
rkyv = { version = "0.7", features = ["validation"] }
bytecheck = "0.6"

# HTTP client for RFC/OWASP fetching
ureq = { version = "2.9", features = ["tls"] }

# Pattern learning
uuid = { version = "1.11", features = ["v4", "serde"] }
chrono = { version = "0.4", features = ["serde"] }
once_cell = "1.20"

# System info
whoami = "1.5"

# Observation storage for LLM evaluation
rusqlite = { version = "0.32", features = ["bundled"] }

# Async trait support for corpus builders
async-trait = "0.1"

# Dependencies compiled only for tests, examples, and benchmarks.
[dev-dependencies]
tempfile = "3.10"