stemedb/applications/aphoria/Cargo.toml
jml 65065f3d8f feat(aphoria): implement community corpus with wiki import and pattern aggregation
Implements Phase 4 (A4) - Community corpus as first-class citizens:

- **Community Corpus Builder** - Queries StemeDB pattern aggregates
- **Wiki Import** - Bootstrap corpus from markdown docs (aphoria corpus import wiki)
- **Pattern Aggregation** - Automatic learning from local scans (--sync flag)
- **Storage Layer** - StemeDBPatternStore with content-addressed deduplication
- **Promotion Logic** - Multi-tier thresholds (95%/80%/50% adoption rates)
- **Corpus Build** - Unified registry for RFC/OWASP/Vendor/Community sources
- **Trust Packs** - Export corpus as signed, distributable artifacts
- **Documentation** - bootstrap-corpus.md guide + CLI reference updates

Technical details:
- Pattern aggregates stored as assertions with predicate "pattern_aggregate"
- Content-addressed subjects via BLAKE3(subject:predicate:value)
- PatternAggregator handles write path (observations → patterns)
- StemeDBPatternStore handles read path (pattern queries)
- Integration tests + fixtures in tests/wiki_import_test.rs

Deleted hardcoded.rs (368 lines) - corpus now fully emergent from StemeDB.
Deleted enriched-corpus-patterns.md (677 lines) - feature shipped.

Closes VG-026 (community corpus), part of A4 milestone.

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
2026-02-09 00:12:31 +00:00

94 lines
2.0 KiB
TOML

# Crate metadata for aphoria, which ships both a binary and a library target.
[package]
name = "aphoria"
version = "0.1.0"
authors = ["Orchard9"]
edition = "2021"
license = "MIT"
description = "A code-level truth linter powered by Episteme"
# Binary target: the `aphoria` executable, with its entry point at src/main.rs.
[[bin]]
name = "aphoria"
path = "src/main.rs"
# Library target: the `aphoria` crate, rooted at src/lib.rs.
[lib]
name = "aphoria"
path = "src/lib.rs"
# Inherit the lint configuration declared at the workspace root.
# NOTE(review): an earlier comment here mentioned "CLI overrides", but no
# overrides are declared in this table — presumably they live in the crate
# source as attributes; confirm.
[lints]
workspace = true
[dependencies]
# StemeDB crates, referenced by path relative to applications/aphoria/
stemedb-core = { path = "../../crates/stemedb-core" }
stemedb-ingest = { path = "../../crates/stemedb-ingest" }
stemedb-lens = { path = "../../crates/stemedb-lens" }
stemedb-query = { path = "../../crates/stemedb-query" }
stemedb-storage = { path = "../../crates/stemedb-storage" }
stemedb-wal = { path = "../../crates/stemedb-wal" }

# Command-line interface
clap = { version = "4.5", features = ["derive"] }

# Async runtime
tokio = { version = "1", features = ["full"] }

# File walking
ignore = "0.4"

# Parallel extraction
rayon = "1.10"

# Pattern matching
globset = "0.4"
regex = "1.10"

# Serialization
# NOTE(review): serde_yaml 0.9 appears to be deprecated upstream — confirm and
# consider a maintained replacement.
serde = { version = "1.0", features = ["derive"] }
serde_json = "1.0"
serde_yaml = "0.9"
toml = "0.8"

# Output formatting
comfy-table = "7.1"

# Cryptography (hashing, signatures, randomness) and hex encoding
blake3 = "1.5"
ed25519-dalek = { version = "2.1", features = ["rand_core"] }
hex = "0.4"
rand = "0.8"

# Error handling
thiserror = "1.0"

# Platform directories
dirs = "5.0"

# Logging
tracing = "0.1"
tracing-subscriber = { version = "0.3", features = ["env-filter"] }

# rkyv for zero-copy (kept consistent with stemedb)
bytecheck = "0.6"
rkyv = { version = "0.7", features = ["validation"] }

# HTTP client for RFC/OWASP fetching
ureq = { version = "2.9", features = ["tls"] }

# Pattern learning
chrono = { version = "0.4", features = ["serde"] }
once_cell = "1.20"
uuid = { version = "1.11", features = ["v4", "serde"] }

# System info
whoami = "1.5"

# Observation storage for LLM evaluation
rusqlite = { version = "0.32", features = ["bundled"] }

# Async trait support for corpus builders
async-trait = "0.1"
# Dependencies compiled only for tests, examples, and benchmarks.
[dev-dependencies]
tempfile = "3.10"