From 5a28c8f31636c88db05d2b3cbeec9df92d854028 Mon Sep 17 00:00:00 2001 From: Ed_ Date: Sat, 20 Jun 2026 07:57:53 -0400 Subject: [PATCH] conductor(track): nagent_review_v3 Phase 1 setup + audit --- .../nagent_review_20260608/metadata.json | 57 ++++++++ .../nagent_review_v3_20260619.md | 75 +++++++++++ .../tracks/nagent_review_20260608/state.toml | 122 ++++++++++++++++++ 3 files changed, 254 insertions(+) create mode 100644 conductor/tracks/nagent_review_20260608/nagent_review_v3_20260619.md diff --git a/conductor/tracks/nagent_review_20260608/metadata.json b/conductor/tracks/nagent_review_20260608/metadata.json index 37060635..9b4cf8ea 100644 --- a/conductor/tracks/nagent_review_20260608/metadata.json +++ b/conductor/tracks/nagent_review_20260608/metadata.json @@ -1,4 +1,61 @@ { + "version": "v3", + "v3_initialized": "2026-06-19", + "v3_owner": "Tier 1 Orchestrator (sole author; Tier 2 executing per plan_v3.md)", + "nagent_commits_reviewed": [ + "a1f0680", "023e23a", "bdfa2a6", "a4fb141", "12c35b7", + "6b762da", "315fe9e", "65787a6", "d56f0f0", "49e07f3", + "7a7e242", "065168c", "2edc7ee", "5075f6e", "6426a67", + "afc7ab8", "38d3d4f", "6443d70", "c1d2cad", "f3ec090", + "24cf16d", "199a36b", "557dd39", "54c8741" + ], + "nagent_reviewed_at_commit": "a1f068098c02d47c28fe9bad7dd7db0ae4af465b", + "nagent_reviewed_at_date_utc": "2026-06-18T23:51:28Z", + "nagent_baseline_at_v2_3": "eb6be32a (2026-06-12T00:25:50Z)", + "case_study_repos": [ + {"repo": "macton/pep-copt", "url": "https://github.com/macton/pep-copt", "result": "2.04x speedup, byte-identical output (24-image benchmark)"}, + {"repo": "macton/differentiable-collisions-optc", "url": "https://github.com/macton/differentiable-collisions-optc", "result": "102x speedup on 1000-pair benchmark, distance-tolerance match contract"} + ], + "v3_scope": { + "new_files": [ + "nagent_review_v3_20260619.md", + "nagent_takeaways_v3_20260619.md", + "plan_v3.md" + ], + "modified_files": [ + "comparison_table.md", + "decisions.md", 
+ "metadata.json", + "state.toml" + ], + "deleted_files": [], + "preserved_files_NOT_modified": [ + "spec.md (v2.3 spec, historical)", + "plan.md (v2.3 plan, historical)", + "nagent_review_v2_3_20260612.md (v2.3 canonical review, historical)", + "nagent_review_v2_20260612.md (v2 review, historical)", + "nagent_review_v2_1_20260612.md (v2.1 user-revised, historical)", + "nagent_review_v2_2_20260612.md (v2.2 focused delta, historical)", + "report.md (v1 review, historical)", + "nagent_takeaways_20260608.md (v2.3-era bridge, unchanged)" + ] + }, + "v3_verification_criteria": [ + "All 11 clusters present in nagent_review_v3_20260619.md as dedicated sections", + "Every cluster section cites >=3 source paths (commit SHA, file:line, prompts/*.md, OPTIMIZATION-LOG.md, or harness script)", + "Clusters 9, 10, 11 cite actual prompts/create-*.md, OPTIMIZATION-LOG.md, and prove-optimized-harness.sh content (not README paraphrases)", + "Format commitment verified: no JSON blocks in main review; 7-column tables in comparison_table.md; SSDL shape tags present; survey grammar in code examples; source-read citations present", + "decisions.md has ~25-30 candidates with v2.3 -> v3 status mapping at top", + "nagent_takeaways_v3_20260619.md has 5-part structure (TL;DR + cross-ref table + new takeaways + v2.3-superseded + sibling pointer)", + "spec_v3.md + plan_v3.md committed; metadata.json refreshed; state.toml updated; tracks.md not modified", + "One commit per cluster phase; git notes attached per task; per-task commit SHAs in state.toml" + ], + "v3_deferred_to_followup_tracks": [ + "Cross-track synthesis (compare operating rules across nagent + Fable + project DOD + superpowers using-superpowers) - flagged in spec_v3.md S3.1 as a stretch goal", + "v3 candidates in decisions.md are inputs to the user's deferred Manual Slop rebuild, not v3 itself" + ], + "v3_phases_count": 14, + "v3_total_target_loc": "5500-6500 LOC for nagent_review_v3_20260619.md + 150 LOC for 
nagent_takeaways_v3_20260619.md", "track_id": "nagent_review_20260608", "name": "nagent Review (Mike Acton's data-oriented LLM agent reference)", "initialized": "2026-06-08", diff --git a/conductor/tracks/nagent_review_20260608/nagent_review_v3_20260619.md b/conductor/tracks/nagent_review_20260608/nagent_review_v3_20260619.md new file mode 100644 index 00000000..12dc2b82 --- /dev/null +++ b/conductor/tracks/nagent_review_20260608/nagent_review_v3_20260619.md @@ -0,0 +1,75 @@ +# nagent_review_v3_20260619 — Mike Acton's nagent, the 24-commit evolution + case studies + +**Status:** Draft (Phase 1 setup complete; cluster sections pending) +**Initialized:** 2026-06-19 +**Owner:** Tier 1 Orchestrator (sole author; Tier 2 executing per `plan_v3.md`) +**Spec pair:** `spec_v3.md` + `plan_v3.md` (in the same track directory) +**Lineage:** Supersedes `nagent_review_v2_3_20260612.md` (4,969 lines, the v2.3 canonical review). v2.3 is preserved as historical. +**Source state:** `macton/nagent@a1f0680` (2026-06-18 23:51:28 UTC) + the two case-study repos at `main`. + +> **Reading guide.** v3 covers the 24 new nagent commits on `macton/nagent@main` between `eb6be32a` (2026-06-12) and `a1f0680` (2026-06-18), and the two case-study repos that didn't exist at v2.3 baseline: [`macton/pep-copt`](https://github.com/macton/pep-copt) and [`macton/differentiable-collisions-optc`](https://github.com/macton/differentiable-collisions-optc). The 11 clusters are: Campaigns (§1), Conversation safety net (§2), Hooks (§3), Project-local roots (§4), Provider expansion (§5), Delegation rewrite (§6), Robustness (§7), Operating rules (§8), Case-study methodology (§9), PEP case study (§10), Collisions case study (§11). + +> **Lineage note.** v2.3's 14-pattern analysis stands; v3 does not delete it. Where v3 updates a v2.3 pattern, the cluster section calls out the update explicitly. Where v3 introduces a new pattern, the cluster section cites the v2.3 pattern it does NOT replace (if any). 
+ +## §0 TL;DR + +(filled in by Phase 13; placeholder — v3 covers the 24-commit nagent evolution between `eb6be32a` and `a1f0680`, plus two case-study repos that demonstrate nagent's per-turn proof harness in production. Three entirely new first-class subsystems land: Campaigns, Conversation safety net, and Hooks. The case-study methodology (4 prompts + proof harness + optimization log + committed-input sha256 freeze) is itself a reusable abstraction. Updates to existing patterns: 6 providers instead of 5 (Together added), delegation rewrite fixes a recursion bug, robustness commits harden the loop, and the operating rules get a new Q9 for "sampling justifies replacing the machine.") + +## §1 Campaigns + +(filled in by Phase 2 — covers `24cf16d`, `199a36b`, `f3ec090`, `c1d2cad`, `6443d70`, `7a7e242`) + +## §2 Conversation safety net + +(filled in by Phase 3 — covers `38d3d4f`, `6426a67`) + +## §3 Hooks + +(filled in by Phase 4 — covers `a4fb141` + both case-study harness scripts) + +## §4 Project-local roots + +(filled in by Phase 5 — covers `54c8741`, `557dd39`, `0b9d1a2`, `023e23a`) + +## §5 Provider expansion + +(filled in by Phase 6 — covers `bdfa2a6`, `5075f6e`, `2edc7ee`) + +## §6 Delegation rewrite + +(filled in by Phase 7 — covers `d56f0f0`, `65787a6`, `315fe9e`) + +## §7 Robustness + +(filled in by Phase 8 — covers `065168c`, `6b762da`, `12c35b7`, `49e07f3`) + +## §8 Operating rules + +(filled in by Phase 9 — covers `a1f0680` + cross-refs Fable) + +## §9 Case-study methodology + +(filled in by Phase 10 — the 5-element pattern + GPT-5.5 note + sibling-review cross-refs) + +## §10 PEP case study + +(filled in by Phase 11 — `macton/pep-copt` deep-dive: 2.04× speedup, byte-identical output) + +## §11 Collisions case study + +(filled in by Phase 12 — `macton/differentiable-collisions-optc` deep-dive: 102× speedup, distance-tolerance match contract) + +## §12 Decisions + +Pointer to `decisions.md` (filled in by Phase 13). 
The full candidate list: v2.3's 16 + v3's new ~10-14, with v2.3 → v3 status mapping (PROMOTE / SUPERSEDE / STILL-OPEN / WITHDRAW) at the top of `decisions.md`. + +## §13 Cross-references + +Pointer to `nagent_takeaways_v3_20260619.md` for the bridge to v2.3 takeaways + the sibling reviews: +- `fable_review_20260617` — Fable's analysis of the Mythos system prompt (touchpoint: §8 Operating rules) +- `intent_dsl_survey_20260612` — the 10 prior-art clusters (touchpoint: §9 Case-study methodology) +- `superpowers_review_20260619` — the superpowers plugin review (touchpoint: §9 Case-study methodology, process parallel via the `brainstorming` skill) + +## §14 References + +(filled in incrementally as clusters commit — see `state.toml` `[v3_tasks]` for per-task commit SHAs) \ No newline at end of file diff --git a/conductor/tracks/nagent_review_20260608/state.toml b/conductor/tracks/nagent_review_20260608/state.toml index 07d1e2c9..7e9e0dbe 100644 --- a/conductor/tracks/nagent_review_20260608/state.toml +++ b/conductor/tracks/nagent_review_20260608/state.toml @@ -167,6 +167,128 @@ candidate_08_coedited_files_tools = { priority = "LOW", user_flag = "none", candidate_09_split_patch_lib = { priority = "DEFER", user_flag = "none", domain = "App", effort = "Medium (defer until need)" } candidate_10_raw_transcript_persistence = { priority = "LOW", user_flag = "none", domain = "App", effort = "Small" } +# v3 review (2026-06-19): the 24-commit evolution + 2 case-study repos +# See spec_v3.md + plan_v3.md. Tier 1 sole-authored; Tier 2 executing per plan_v3.md. 
+ +[v3_meta] +v3_initialized = "2026-06-19" +v3_status = "active" +v3_current_phase = 1 +v3_last_updated = "2026-06-19" + +[v3_phases] +phase_1 = { status = "in_progress", checkpointsha = "", name = "Setup + audit" } +phase_2 = { status = "pending", checkpointsha = "", name = "Campaigns cluster (S1)" } +phase_3 = { status = "pending", checkpointsha = "", name = "Conversation safety net cluster (S2)" } +phase_4 = { status = "pending", checkpointsha = "", name = "Hooks cluster (S3)" } +phase_5 = { status = "pending", checkpointsha = "", name = "Project-local roots cluster (S4)" } +phase_6 = { status = "pending", checkpointsha = "", name = "Provider expansion cluster (S5)" } +phase_7 = { status = "pending", checkpointsha = "", name = "Delegation rewrite cluster (S6)" } +phase_8 = { status = "pending", checkpointsha = "", name = "Robustness cluster (S7)" } +phase_9 = { status = "pending", checkpointsha = "", name = "Operating rules cluster (S8)" } +phase_10 = { status = "pending", checkpointsha = "", name = "Case-study methodology cluster (S9)" } +phase_11 = { status = "pending", checkpointsha = "", name = "PEP case study cluster (S10)" } +phase_12 = { status = "pending", checkpointsha = "", name = "Collisions case study cluster (S11)" } +phase_13 = { status = "pending", checkpointsha = "", name = "Refresh side artifacts (comparison_table, decisions, takeaways)" } +phase_14 = { status = "pending", checkpointsha = "", name = "Format-commitment verification + final commit" } + +[v3_tasks] +t1_1 = { status = "completed", commit_sha = "", description = "Refresh metadata.json with v3 fields" } +t1_2 = { status = "in_progress", commit_sha = "", description = "Initialize state.toml v3 fields" } +t1_3 = { status = "pending", commit_sha = "", description = "Confirm spec_v3.md + plan_v3.md exist (skeleton ack)" } +t1_4 = { status = "pending", commit_sha = "", description = "Write nagent_review_v3_20260619.md skeleton (11 cluster placeholders + frontmatter)" } +t1_5 = { status = 
"pending", commit_sha = "", description = "Commit Phase 1 setup" } +t2_1 = { status = "pending", commit_sha = "", description = "Phase 2 source-read 6 campaigns commits (24cf16d, 199a36b, f3ec090, c1d2cad, 6443d70, 7a7e242)" } +t2_2 = { status = "pending", commit_sha = "", description = "Phase 2 identify campaigns abstraction" } +t2_3 = { status = "pending", commit_sha = "", description = "Phase 2 compare to v2.3 14 patterns" } +t2_4 = { status = "pending", commit_sha = "", description = "Phase 2 write S1 Campaigns section" } +t2_5 = { status = "pending", commit_sha = "", description = "Phase 2 commit S1 + git note" } +t3_1 = { status = "pending", commit_sha = "", description = "Phase 3 source-read 2 safety-net commits (38d3d4f, 6426a67)" } +t3_2 = { status = "pending", commit_sha = "", description = "Phase 3 identify safety-net abstraction" } +t3_3 = { status = "pending", commit_sha = "", description = "Phase 3 compare to v2.3" } +t3_4 = { status = "pending", commit_sha = "", description = "Phase 3 write S2 Conversation safety net section" } +t3_5 = { status = "pending", commit_sha = "", description = "Phase 3 commit S2 + git note" } +t4_1 = { status = "pending", commit_sha = "", description = "Phase 4 source-read hooks commit (a4fb141) + both harness scripts" } +t4_2 = { status = "pending", commit_sha = "", description = "Phase 4 identify hooks abstraction" } +t4_3 = { status = "pending", commit_sha = "", description = "Phase 4 compare to v2.3" } +t4_4 = { status = "pending", commit_sha = "", description = "Phase 4 write S3 Hooks section" } +t4_5 = { status = "pending", commit_sha = "", description = "Phase 4 commit S3 + git note" } +t5_1 = { status = "pending", commit_sha = "", description = "Phase 5 source-read 4 commits (54c8741, 557dd39, 0b9d1a2, 023e23a)" } +t5_2 = { status = "pending", commit_sha = "", description = "Phase 5 identify project-local-roots abstraction" } +t5_3 = { status = "pending", commit_sha = "", description = "Phase 5 compare to v2.3" } 
+t5_4 = { status = "pending", commit_sha = "", description = "Phase 5 write S4 Project-local roots section" } +t5_5 = { status = "pending", commit_sha = "", description = "Phase 5 commit S4 + git note" } +t6_1 = { status = "pending", commit_sha = "", description = "Phase 6 source-read 3 provider commits (bdfa2a6, 5075f6e, 2edc7ee)" } +t6_2 = { status = "pending", commit_sha = "", description = "Phase 6 identify provider expansion abstraction" } +t6_3 = { status = "pending", commit_sha = "", description = "Phase 6 compare to v2.3" } +t6_4 = { status = "pending", commit_sha = "", description = "Phase 6 write S5 Provider expansion section" } +t6_5 = { status = "pending", commit_sha = "", description = "Phase 6 commit S5 + git note" } +t7_1 = { status = "pending", commit_sha = "", description = "Phase 7 source-read 3 delegation commits (d56f0f0, 65787a6, 315fe9e)" } +t7_2 = { status = "pending", commit_sha = "", description = "Phase 7 identify delegation abstraction (recursion bug + fix)" } +t7_3 = { status = "pending", commit_sha = "", description = "Phase 7 compare to v2.3" } +t7_4 = { status = "pending", commit_sha = "", description = "Phase 7 write S6 Delegation rewrite section" } +t7_5 = { status = "pending", commit_sha = "", description = "Phase 7 commit S6 + git note" } +t8_1 = { status = "pending", commit_sha = "", description = "Phase 8 source-read 4 robustness commits (065168c, 6b762da, 12c35b7, 49e07f3)" } +t8_2 = { status = "pending", commit_sha = "", description = "Phase 8 identify robustness abstractions" } +t8_3 = { status = "pending", commit_sha = "", description = "Phase 8 compare to v2.3" } +t8_4 = { status = "pending", commit_sha = "", description = "Phase 8 write S7 Robustness section" } +t8_5 = { status = "pending", commit_sha = "", description = "Phase 8 commit S7 + git note" } +t9_1 = { status = "pending", commit_sha = "", description = "Phase 9 source-read a1f0680 operating-rules commit" } +t9_2 = { status = "pending", commit_sha = "", 
description = "Phase 9 identify operating-rules abstraction" } +t9_3 = { status = "pending", commit_sha = "", description = "Phase 9 compare to v2.3" } +t9_4 = { status = "pending", commit_sha = "", description = "Phase 9 cross-reference fable_review_20260617" } +t9_5 = { status = "pending", commit_sha = "", description = "Phase 9 write S8 Operating rules section" } +t9_6 = { status = "pending", commit_sha = "", description = "Phase 9 commit S8 + git note" } +t10_1 = { status = "pending", commit_sha = "", description = "Phase 10 read both case-study READMEs" } +t10_2 = { status = "pending", commit_sha = "", description = "Phase 10 fetch one prompt file from each repo as sample" } +t10_3 = { status = "pending", commit_sha = "", description = "Phase 10 identify case-study methodology abstraction (5-element pattern)" } +t10_4 = { status = "pending", commit_sha = "", description = "Phase 10 note the GPT-5.5 string" } +t10_5 = { status = "pending", commit_sha = "", description = "Phase 10 cross-reference intent_dsl_survey + superpowers_review" } +t10_6 = { status = "pending", commit_sha = "", description = "Phase 10 write S9 Case-study methodology section" } +t10_7 = { status = "pending", commit_sha = "", description = "Phase 10 commit S9 + git note" } +t11_1 = { status = "pending", commit_sha = "", description = "Phase 11 read all 5 pep-copt commits" } +t11_2 = { status = "pending", commit_sha = "", description = "Phase 11 read OPTIMIZATION-LOG.md in full" } +t11_3 = { status = "pending", commit_sha = "", description = "Phase 11 read prove-optimized-harness.sh in full" } +t11_4 = { status = "pending", commit_sha = "", description = "Phase 11 read the 4 prompts in full" } +t11_5 = { status = "pending", commit_sha = "", description = "Phase 11 identify kept optimizations" } +t11_6 = { status = "pending", commit_sha = "", description = "Phase 11 identify rejected optimizations" } +t11_7 = { status = "pending", commit_sha = "", description = "Phase 11 compare to v2.3" } 
+t11_8 = { status = "pending", commit_sha = "", description = "Phase 11 write S10 PEP case study section" } +t11_9 = { status = "pending", commit_sha = "", description = "Phase 11 commit S10 + git note" } +t12_1 = { status = "pending", commit_sha = "", description = "Phase 12 read all 5 collisions-optc commits" } +t12_2 = { status = "pending", commit_sha = "", description = "Phase 12 read OPTIMIZATION-LOG.md in full" } +t12_3 = { status = "pending", commit_sha = "", description = "Phase 12 read prove-optimized-harness.sh in full" } +t12_4 = { status = "pending", commit_sha = "", description = "Phase 12 read the 4 prompts in full" } +t12_5 = { status = "pending", commit_sha = "", description = "Phase 12 identify kept optimizations" } +t12_6 = { status = "pending", commit_sha = "", description = "Phase 12 identify rejected optimizations" } +t12_7 = { status = "pending", commit_sha = "", description = "Phase 12 document match contract" } +t12_8 = { status = "pending", commit_sha = "", description = "Phase 12 compare to v2.3 + S10 cross-ref" } +t12_9 = { status = "pending", commit_sha = "", description = "Phase 12 write S11 Collisions case study section" } +t12_10 = { status = "pending", commit_sha = "", description = "Phase 12 commit S11 + git note" } +t13_1 = { status = "pending", commit_sha = "", description = "Phase 13 write comparison_table.md (v3)" } +t13_2 = { status = "pending", commit_sha = "", description = "Phase 13 write decisions.md (v3 with v2.3 status mapping)" } +t13_3 = { status = "pending", commit_sha = "", description = "Phase 13 write nagent_takeaways_v3_20260619.md" } +t13_4 = { status = "pending", commit_sha = "", description = "Phase 13 write S0 TL;DR + S12-14 in main review" } +t13_5 = { status = "pending", commit_sha = "", description = "Phase 13 commit + git note" } +t14_1 = { status = "pending", commit_sha = "", description = "Phase 14 grep verification: no JSON blocks" } +t14_2 = { status = "pending", commit_sha = "", description = "Phase 14 
grep verification: 7-column tables present" } +t14_3 = { status = "pending", commit_sha = "", description = "Phase 14 grep verification: SSDL shape tags present" } +t14_4 = { status = "pending", commit_sha = "", description = "Phase 14 grep verification: survey grammar present" } +t14_5 = { status = "pending", commit_sha = "", description = "Phase 14 grep verification: source-read citations per cluster" } +t14_6 = { status = "pending", commit_sha = "", description = "Phase 14 grep verification: decisions.md candidate count 25-30" } +t14_7 = { status = "pending", commit_sha = "", description = "Phase 14 grep verification: takeaways bridge 5-part structure" } +t14_8 = { status = "pending", commit_sha = "", description = "Phase 14 final commit + git note" } + +[v3_verification] +v3_coverage_complete = false +v3_source_read_citations_complete = false +v3_case_study_evidence_complete = false +v3_format_commitment_verified = false +v3_decisions_count_in_range = false +v3_takeaways_bridge_complete = false +v3_track_artifacts_committed = false +v3_commits_with_notes = false + [status] # Track is a reference/analysis track; "active" means the artifacts are ready for review # The track will move to "completed" and be archived when: