hyperpolymath
diff --git a/‎.machine_readable/6a2/STATE.a2ml‎
Lines changed: 45 additions & 3 deletions b/‎.machine_readable/6a2/STATE.a2ml‎
Lines changed: 45 additions & 3 deletions
diff --git a/‎TEST-NEEDS.md‎
Lines changed: 45 additions & 29 deletions b/‎TEST-NEEDS.md‎
Lines changed: 45 additions & 29 deletions
@@ -1,14 +1,56 @@
 # SPDX-License-Identifier: PMPL-1.0-or-later
 # STATE.a2ml — Project state checkpoint
 # Converted from STATE.scm on 2026-03-15
+# Updated: 2026-04-04 — CRG C blitz
 
 [metadata]
 project = "nextgen-databases"
 version = "0.1.0"
-last-updated = "2026-03-15"
+last-updated = "2026-04-04"
 status = "active"
 
 [project-context]
 name = "nextgen-databases"
-completion-percentage = 0
-phase = "In development"
+completion-percentage = 35
+phase = "CRG C — Testing & Benchmarking blitz"
+
+[current-position]
+milestone = "CRG C test coverage"
+last-session = "2026-04-04"
+last-action = "Added E2E, P2P property, security, concurrency tests and throughput benchmarks"
+
+[test-coverage]
+unit-tests = "~40 (Elixir consensus + federation adapters)"
+integration-tests = "~12 (federation adapter integration)"
+e2e-tests = "18 (e2e_verisimdb_test.exs — lifecycle, VQL, schema, error handling)"
+p2p-property-tests = "5 properties + 1 unit (kraft_property_test.exs)"
+aspect-security = "10 tests (aspect/security_test.exs)"
+aspect-concurrency = "14 tests (aspect/concurrency_test.exs)"
+smoke-tests = "Gleam smoke test for lithoglyph BEAM (lith_beam_smoke_test.gleam)"
+benchmarks = "2 Rust files (modality_benchmarks.rs + throughput_benchmarks.rs)"
+total-new-tests = "43 new tests + 5 properties (2026-04-04)"
+
+[test-status]
+mix-test-failures = "6 pre-existing (VQLTypeChecker binary_to_existing_atom crash, KRaft remove_server timeout)"
+new-test-failures = "0"
+cargo-bench-compile = "PASS (throughput_benchmarks.rs — no errors, no warnings in bench file)"
+gleam-smoke = "Written; requires compiled lith_nif.so to run connection/lifecycle tests"
+
+[blockers]
+- "VQLTypeChecker calls :erlang.binary_to_existing_atom for unknown proof types → ArgumentError (P1 hardening gap)"
+- "VQL parser does not strip null bytes from entity IDs (C-string truncation risk at FFI, P1)"
+- "Integration test (tests/integration_test.rs) uses old API — does not compile (pre-existing)"
+- "modality_benchmarks.rs uses old API — does not compile (pre-existing)"
+
+[route-to-mvp]
+next = "Fix VQLTypeChecker binary_to_existing_atom crash (P1 hardening)"
+then = "Fix null-byte entity ID sanitisation in VQL parser"
+then = "Update integration_test.rs to current API"
+then = "Add real fuzz harness (replace placeholder.txt)"
+then = "Complete remaining E2E scenarios (federation, node failure/recovery)"
+
+[critical-next-actions]
+1 = "Run full mix test suite to confirm 6-failure baseline is stable"
+2 = "Fix VQLTypeChecker to use String.to_existing_atom with rescue guard (P1)"
+3 = "Add null-byte sanitisation in VQLBridge built-in parser (P1)"
+4 = "Update integration_test.rs to use ConcreteOctadStore from verisim-api"
@@ -1,55 +1,63 @@
 # TEST-NEEDS.md — nextgen-databases
 
 > Generated 2026-03-29 by punishing audit.
+> Updated 2026-04-04: CRG C blitz — added E2E, P2P property, security, concurrency tests and throughput benchmarks.
 
 ## Current State
 
-| Category     | Count | Notes |
-|-------------|-------|-------|
-| Unit tests   | ~40   | VeriSimDB Elixir: consensus (kraft_node, kraft_wal, kraft_recovery, kraft_transport), federation adapters (mongodb, redis, duckdb, clickhouse, surrealdb, sqlite, neo4j, vector_db, influxdb, object_storage), resolver, adapter + base tests |
-| Integration  | ~12   | Federation adapter integration tests (mongodb, redis, neo4j, clickhouse, surrealdb, influxdb) |
-| E2E          | 0     | None |
-| Benchmarks   | 2     | verisimdb/benches/modality_benchmarks.rs (Rust), lithoglyph core-factor benchmarks.factor |
+| Category     | Count  | Notes |
+|-------------|--------|-------|
+| Unit tests   | ~40    | VeriSimDB Elixir: consensus (kraft_node, kraft_wal, kraft_recovery, kraft_transport), federation adapters (mongodb, redis, duckdb, clickhouse, surrealdb, sqlite, neo4j, vector_db, influxdb, object_storage), resolver, adapter + base tests |
+| Integration  | ~12    | Federation adapter integration tests (mongodb, redis, neo4j, clickhouse, surrealdb, influxdb) |
+| E2E          | 18     | `verisimdb/elixir-orchestration/test/verisim/e2e_verisimdb_test.exs` — lifecycle, VQL, schema, error handling |
+| P2P (property) | 5 props + 1 test | `verisimdb/elixir-orchestration/test/verisim/consensus/kraft_property_test.exs` — leader uniqueness, log replication, state machine, partition tolerance, read-your-writes |
+| Aspect: Security | 10 tests | `verisimdb/elixir-orchestration/test/verisim/aspect/security_test.exs` — VQL injection, unauthorised access, cross-tenant isolation, error disclosure |
+| Aspect: Concurrency | 14 tests | `verisimdb/elixir-orchestration/test/verisim/aspect/concurrency_test.exs` — concurrent entity writes, parallel VQL, concurrent Kraft proposals, DriftMonitor load, SchemaRegistry concurrency |
+| lithoglyph smoke | Gleam | `lithoglyph/beam/test/lith_beam_smoke_test.gleam` — version, connect, lifecycle, error handling |
+| Benchmarks   | 2 real files | `verisimdb/benches/modality_benchmarks.rs` (Rust, pre-existing), `verisimdb/benches/throughput_benchmarks.rs` (Rust, new — write throughput, read latency, VQL complexity) |
 
 **Source modules:** ~833 across 2 major subsystems. verisimdb: ~248 files (Rust core, Elixir orchestration, Gleam, Idris2 ABI, Zig FFI, ReScript). lithoglyph: ~212 files (Gleam, Rust, Factor).
 
-## What's Missing
+## What's Done (2026-04-04)
+
+### Completed
+- [x] VeriSimDB E2E tests (18 tests): write→read lifecycle, VQL pipeline, schema validation, error handling
+- [x] Kraft consensus P2P property tests (5 properties + 1 unit): leader uniqueness, log replication, state machine safety, partition tolerance, read-your-writes
+- [x] VQL security aspect tests (10 tests): injection hardening, auth rejection, cross-tenant isolation, error disclosure
+- [x] Concurrency aspect tests (14 tests): concurrent EntityServer writes, parallel VQL, concurrent Kraft proposals, DriftMonitor load, SchemaRegistry concurrent registration
+- [x] lithoglyph Gleam smoke test: lifecycle smoke (graceful-failure when NIF not compiled)
+- [x] Rust throughput benchmarks: write throughput (1/10/100 batch), read latency (hot/cold), VQL complexity tiers, write-read round-trip latency
+
+### Known Gaps Surfaced by Tests
+- VQLTypeChecker calls `:erlang.binary_to_existing_atom/1` for unknown proof types → ArgumentError (hardening gap, P1)
+- VQL built-in parser does NOT strip null bytes from entity IDs (C-string truncation risk at FFI layer, P1)
+- SchemaRegistry.register_type/1 returns `{:error, :already_exists}` for duplicate IRIs rather than idempotent `:ok` (P2)
+- `kraft_node_test.exs` `remove_server` test has a GenServer timeout (pre-existing, P2)
+
+## What's Still Missing
 
 ### P2P (Property-Based) Tests
-- [ ] Kraft consensus: property tests for leader election, log replication, partition tolerance
 - [ ] CRDT convergence: property tests for VeriSimDB's CRDT operations
-- [ ] VQL query parsing: arbitrary query fuzzing
+- [ ] VQL query parsing: arbitrary query fuzzing (replace fuzz placeholder)
 - [ ] Federation: property tests for data consistency across adapters
 - [ ] lithoglyph: data structure invariant tests
 
 ### E2E Tests
-- [ ] VeriSimDB: full write -> replicate -> read across nodes
-- [ ] Federation: write through adapter -> verify in external DB -> read back
-- [ ] Kraft consensus: cluster formation -> leader election -> write -> node failure -> recovery
-- [ ] lithoglyph: full lifecycle (create -> write -> query -> archive)
+- [ ] Federation: write through adapter → verify in external DB → read back
+- [ ] Kraft consensus: cluster formation → leader election → write → node failure → recovery
 - [ ] VQL: complex query execution with joins/aggregations
 
-### Aspect Tests
-- **Security:** No tests for authentication bypass, unauthorized federation access, injection through VQL, data exfiltration across adapters
-- **Performance:** Rust modality benchmark exists. Missing: Elixir orchestration throughput, Kraft consensus latency, federation adapter comparison benchmarks
-- **Concurrency:** No tests for concurrent writes across Kraft nodes, federation adapter connection pooling, VQL query contention
-- **Error handling:** No tests for adapter connection failure, Kraft split-brain recovery, malformed VQL, storage corruption
-
 ### Build & Execution
-- [ ] `mix test` for VeriSimDB Elixir
-- [ ] `cargo test` for VeriSimDB Rust
-- [ ] `gleam test` for lithoglyph
+- [ ] `mix test` for VeriSimDB Elixir (currently 6 pre-existing failures, not from new tests)
+- [ ] `cargo test` for VeriSimDB Rust (integration test uses old API)
+- [ ] `gleam test` for lithoglyph Gleam (requires compiled NIF)
 - [ ] Zig FFI tests
-- [ ] Container-based multi-node tests
 
-### Benchmarks Needed
-- [ ] Write throughput (single node, cluster)
-- [ ] Read latency (hot, cold, cache miss)
+### Benchmarks Still Needed
 - [ ] Kraft consensus round-trip time
 - [ ] Federation adapter roundtrip per backend
-- [ ] VQL query execution time by complexity
 - [ ] lithoglyph query performance
-- [ ] Replication lag measurement
+- [ ] Replication lag measurement (multi-node)
 
 ### Self-Tests
 - [ ] Cluster health self-check
@@ -59,7 +67,15 @@
 
 ## Priority
 
-**CRITICAL.** Two database systems with 833 source files and ~52 tests (6.2%). The consensus layer (Kraft) has 4 tests for a distributed consensus protocol — that is dangerously low. Federation adapters have decent unit coverage but zero E2E. lithoglyph appears to have no dedicated tests at all. A database with no concurrency tests is a ticking time bomb.
+**Partially addressed.** All CRG C test categories are now represented:
+- Unit + smoke: pre-existing + new E2E lifecycle tests
+- Build verification: `mix test` runs (6 pre-existing failures, not from new tests)
+- P2P: KRaft property tests
+- E2E: full lifecycle + VQL + schema + error paths
+- Reflexive: type hierarchy, schema self-validation
+- Contract: VQL proof certificate tests (pre-existing)
+- Aspect: security injection + concurrency tests
+- Benchmarks: Rust throughput/latency/VQL complexity baselines
 
 ## FAKE-FUZZ ALERT