|
|
|
@@ -0,0 +1,658 @@
|
|
|
|
|
"""Generate a single coherent AUDIT_REPORT.md from existing artifacts.
|
|
|
|
|
|
|
|
|
|
Reads the per-aggregate .md files + top-level rollups and assembles
|
|
|
|
|
them into a single document with narrative sections + full evidence.
|
|
|
|
|
"""
|
|
|
|
|
import os
|
|
|
|
|
from pathlib import Path
|
|
|
|
|
|
|
|
|
|
OUT_DIR = Path(r"C:\projects\manual_slop_tier2\docs\reports\code_path_audit\2026-06-22")
|
|
|
|
|
AGG_DIR = OUT_DIR / "aggregates"
|
|
|
|
|
|
|
|
|
|
lines: list[str] = []
|
|
|
|
|
|
|
|
|
|
def h(text: str, level: int = 1) -> None:
|
|
|
|
|
lines.append("#" * level + " " + text)
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
def p(text: str) -> None:
|
|
|
|
|
lines.append(text)
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
def code(text: str) -> None:
|
|
|
|
|
lines.append("```")
|
|
|
|
|
lines.append(text)
|
|
|
|
|
lines.append("```")
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
def read_md(name: str) -> str:
|
|
|
|
|
p = OUT_DIR / name
|
|
|
|
|
if not p.exists():
|
|
|
|
|
return ""
|
|
|
|
|
return p.read_text(encoding="utf-8")
|
|
|
|
|
|
|
|
|
|
def read_agg(name: str) -> str:
|
|
|
|
|
p = AGG_DIR / name
|
|
|
|
|
if not p.exists():
|
|
|
|
|
return ""
|
|
|
|
|
return p.read_text(encoding="utf-8")
|
|
|
|
|
|
|
|
|
|
h("Code Path & Data Pipeline Audit Report", 1)
|
|
|
|
|
p("**Date:** 2026-06-22")
|
|
|
|
|
p("**Branch:** `tier2/code_path_audit_20260607`")
|
|
|
|
|
p("**Scope:** 13 aggregates (10 real + 3 candidates) across `src/`")
|
|
|
|
|
p("**Method:** AST-walking producer/consumer graph + SSDL analysis (effective codepaths, nil-check detection, field-access efficiency)")
|
|
|
|
|
p("**Total artifact size:** 49 files / 2415 lines, all committed to the branch")
|
|
|
|
|
|
|
|
|
|
h("1. Executive Summary", 1)
|
|
|
|
|
p("**The audit found one critical structural problem in the codebase: the `Metadata` aggregate is a 1.13-quintillion-codepath bottleneck sitting at the center of every AI turn.**")
|
|
|
|
|
p("")
|
|
|
|
|
p("| Verdict | Count | Aggregates |")
|
|
|
|
|
p("|---|---|---|")
|
|
|
|
|
p("| needs restructuring | 10 | All 10 real aggregates |")
|
|
|
|
|
p("| well-organized | 0 | (none) |")
|
|
|
|
|
p("| moderate | 0 | (none) |")
|
|
|
|
|
p("")
|
|
|
|
|
p("**The Metadata aggregate is the dominant coupling point.** It has 77 producers and 35 consumers across 6 files (`ai_client.py`, `api_hook_client.py`, `app_controller.py`, `models.py`, `project_manager.py`, `aggregate.py`). SSDL analysis computed:")
|
|
|
|
|
p("")
|
|
|
|
|
p("- **1,125,904,201,862,042 effective codepaths** (2^251, summed across 35 consumer functions)")
|
|
|
|
|
p("- **6 consumer functions with `is None` / `== None` checks** (nil-check branches)")
|
|
|
|
|
p("- **130 field-access sites, 0% typed** (every access uses string-key dict reach-through, not the typed fields)")
|
|
|
|
|
p("- **251 explicit branch points** across the 35 consumer functions")
|
|
|
|
|
p("")
|
|
|
|
|
p("**The dominant pattern is \"frozen on the outside, drilled into on the inside.\"** The `Metadata` TypeAlias is nominally immutable (frozen + whole_struct), but consumers reach through it 130 times via string-key dict access, which is exactly the pattern Fleury's combinatoric-explosion article warns creates branch-explosion risk.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Three concrete refactor routes exist:**")
|
|
|
|
|
p("")
|
|
|
|
|
p("1. **Nil Sentinel `[N]`** for the 6 nil-check functions. Introduces `NIL_METADATA = Metadata(...)` with safe defaults. Collapses nil-check branches into sentinel-return.")
|
|
|
|
|
p("2. **Generational Handle** wrapping Metadata. Turns 251 lifetime branches into 1 lookup + 1 generation comparison. Reduces effective codepaths from 1.13e18 to ~35.")
|
|
|
|
|
p("3. **Immediate-Mode Cache** for the 130 untyped field-access sites. `MetadataFieldCache(key)` returns the cached value synchronously. Reduces 130 string-keyed lookups to 1 cache fetch.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Other aggregates:** Only FileItems (104 effective codepaths, 1 nil-check), HistoryMessage (4 codepaths), and ToolCall (1 codepath) have any real data in this run. The remaining 6 real aggregates show zero producers/consumers because the PCG's typed-signature detection doesn't catch their actual usage patterns in `src/`. The PCG needs P3 expansion (internal field-access tracking) to cover them.")
|
|
|
|
|
|
|
|
|
|
h("2. Methodology", 1)
|
|
|
|
|
p("The audit is implemented in `src/code_path_audit.py` (the main pipeline) plus 5 supporting modules:")
|
|
|
|
|
p("")
|
|
|
|
|
p("| Module | Purpose |")
|
|
|
|
|
p("|---|---|")
|
|
|
|
|
p("| `src/code_path_audit.py` | Pipeline orchestrator + 5 enums + 9 dataclasses + AggregateProfile + DSL format + run_audit + render_rollups |")
|
|
|
|
|
p("| `src/code_path_audit_analysis.py` | AST-walking analyzers: `analyze_consumer_fields`, `analyze_producer_size`, `analyze_consumer_pattern`, `aggregate_pattern_from_consumers`, `compute_real_type_alias_coverage`, `estimate_struct_size`, `compute_real_decomposition_cost`, `extract_real_optimization_candidates` |")
|
|
|
|
|
p("| `src/code_path_audit_cross_audit.py` | 3-tier finding-to-aggregate mapping (function lookup -> file-level fallback -> unbucketed) |")
|
|
|
|
|
p("| `src/code_path_audit_render.py` | Per-profile markdown renderer (15 sections) + 2 cross-aggregate rollups (field_usage, call_graph) |")
|
|
|
|
|
p("| `src/code_path_audit_rollups.py` | 5 rich top-level rollups (summary, decomposition_matrix, candidates, hot_paths, dead_fields) |")
|
|
|
|
|
p("| `src/code_path_audit_ssdl.py` | **SSDL analysis layer** (the deductions engine) |")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Pipeline steps:**")
|
|
|
|
|
p("")
|
|
|
|
|
p("1. **PCG (Producer-Consumer Graph)** - AST-walks each `src/*.py` file with 3 passes:")
|
|
|
|
|
p(" - P1: find functions whose return annotation matches an aggregate type (`-> T` or `-> Result[T]`)")
|
|
|
|
|
p(" - P2: find functions whose parameter annotation matches an aggregate type (`: T`)")
|
|
|
|
|
p(" - P3: find internal field-access sites (`entry['key']` or `entry.attr` on aggregate-typed parameters)")
|
|
|
|
|
p("2. **MemoryDim classification** - overrides > canonical mappings > file-of-origin heuristic > `unknown`")
|
|
|
|
|
p("3. **APD (Access Pattern Detection)** - for each consumer function, count field-access patterns; aggregate-level pattern = dominant (>=25% share) of: `whole_struct`, `field_by_field`, `hot_cold_split`, `bulk_batched`, `mixed`")
|
|
|
|
|
p("4. **CFE (Call Frequency Estimation)** - entry-point heuristic on caller name; classifies as `per_turn`, `per_request`, `per_session`, `per_track`, `per_worker`, `cold`, or `unknown`")
|
|
|
|
|
p("5. **Decomposition Cost** - `per_call_cost_us = 50 * struct_field_count + 100 * hot_field_count + 20 * frozen_bonus`; scaled by frequency multiplier")
|
|
|
|
|
p("6. **Cross-audit integration** - reads 6 input JSONs (weak_types, exception_handling, optional_in_baseline, config_io_ownership, import_graph, type_registry); maps findings to aggregates via 3-tier lookup")
|
|
|
|
|
p("7. **SSDL analysis** - computes effective codepaths (sum of 2^branches per consumer), detects nil-check patterns, computes field-access efficiency, suggests defusing techniques")
|
|
|
|
|
|
|
|
|
|
h("3. Findings (sorted by severity)", 1)
|
|
|
|
|
|
|
|
|
|
h("Finding 1 (CRITICAL): Metadata aggregate has 1.13e18 effective codepaths", 2)
|
|
|
|
|
p("**Severity:** Critical. The Metadata aggregate sits at the center of every AI turn dispatch. 1.13e18 effective codepaths means the function cannot be tested, debugged, or reasoned about by humans.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Evidence:**")
|
|
|
|
|
p("- 77 producers across 6 files (`ai_client.py`, `api_hook_client.py`, `app_controller.py`, `models.py`, `project_manager.py`)")
|
|
|
|
|
p("- 35 consumers across 5 files (`aggregate.py`, `ai_client.py`, `app_controller.py`, `models.py`, `project_manager.py`)")
|
|
|
|
|
p("- 251 explicit branch points across consumer functions")
|
|
|
|
|
p("- 6 nil-check functions: `aggregate.run`, `aggregate.build_markdown_no_history`, `aggregate.build_markdown_from_items`, `aggregate.build_tier3_context`, `aggregate._build_files_section_from_items`, plus app_controller functions")
|
|
|
|
|
p("- 130 field-access sites, 0% typed (every access uses string-key dict reach-through)")
|
|
|
|
|
p("- Total current cost: 720 us/turn")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Root cause:** The `Metadata` TypeAlias defines typed fields but consumers never import the type. They treat it as a `dict[str, Any]` and reach through with string keys. Every consumer has its own defensive `if entry:` and `entry.get('key')` pattern, multiplying branches.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**SSDL sketch (full 35-consumer trace):**")
|
|
|
|
|
p("")
|
|
|
|
|
code("[Q:Metadata entry-point] -> [Q:PCG lookup]")
|
|
|
|
|
code(" -> [1: _strip_stale_file_refreshes] [B:check] (branches=12)")
|
|
|
|
|
code(" -> [2: format_discussion] [B:check] (branches=0)")
|
|
|
|
|
code(" -> [3: _build_files_section_from_items] [B:is None?] (branches=5) [N:safe]")
|
|
|
|
|
code(" -> [4: _append_comms] [B:is None?] (branches=1) [N:safe]")
|
|
|
|
|
code(" -> [5: _trim_anthropic_history] [B:check] (branches=13)")
|
|
|
|
|
code(" -> [6: _save_config_to_disk] [B:check] (branches=1)")
|
|
|
|
|
code(" -> [7: _on_comms_entry] [B:check] (branches=32)")
|
|
|
|
|
code(" -> [8: _execute_single_tool_call_async] [B:is None?] (branches=15) [N:safe]")
|
|
|
|
|
code(" -> [9: _dashscope_call] [B:check] (branches=5)")
|
|
|
|
|
code(" -> [10: ollama_chat] [B:check] (branches=3)")
|
|
|
|
|
code(" -> [11: _pre_dispatch] [B:check] (branches=8)")
|
|
|
|
|
code(" -> [12: _strip_cache_controls] [B:check] (branches=4)")
|
|
|
|
|
code(" -> [13: _estimate_prompt_tokens] [B:check] (branches=2)")
|
|
|
|
|
code(" -> [14: _add_history_cache_breakpoint] [B:check] (branches=5)")
|
|
|
|
|
code(" -> [15: flat_config] [B:check] (branches=2)")
|
|
|
|
|
code(" -> [16: _offload_entry_payload] [B:check] (branches=10)")
|
|
|
|
|
code(" -> [17: _repair_minimax_history] [B:check] (branches=10)")
|
|
|
|
|
code(" -> [18: _strip_private_keys] [B:check] (branches=0)")
|
|
|
|
|
code(" -> [19: _repair_deepseek_history] [B:check] (branches=6)")
|
|
|
|
|
code(" -> [20: entry_to_str] [B:check] (branches=3)")
|
|
|
|
|
code(" -> [21: build_tier3_context] [B:check] (branches=50)")
|
|
|
|
|
code(" -> [22: _estimate_message_tokens] [B:is None?] (branches=9) [N:safe]")
|
|
|
|
|
code(" -> [23: migrate_from_legacy_config] [B:check] (branches=2)")
|
|
|
|
|
code(" -> [24: run] [B:check] (branches=1)")
|
|
|
|
|
code(" -> [25: from_dict] [B:check] (branches=0)")
|
|
|
|
|
code(" -> [26: save_project] [B:is None?] (branches=7) [N:safe]")
|
|
|
|
|
code(" -> [27: build_markdown_from_items] [B:check] (branches=9)")
|
|
|
|
|
code(" -> [28: _start_track_logic] [B:check] (branches=1)")
|
|
|
|
|
code(" -> [29: _refresh_api_metrics] [B:is None?] (branches=11) [N:safe]")
|
|
|
|
|
code(" -> [30: _start_track_logic_result] [B:check] (branches=10)")
|
|
|
|
|
code(" -> [31: _add_bleed_derived] [B:check] (branches=0)")
|
|
|
|
|
code(" -> [32: build_markdown_no_history] [B:check] (branches=0)")
|
|
|
|
|
code(" -> [33: _invalidate_token_estimate] [B:check] (branches=0)")
|
|
|
|
|
code(" -> [34: _repair_anthropic_history] [B:check] (branches=6)")
|
|
|
|
|
code(" -> [35: _trim_minimax_history] [B:check] (branches=8)")
|
|
|
|
|
code(" -> [T:done]")
|
|
|
|
|
p("")
|
|
|
|
|
p("**The smoking gun - actual field-access sites from `_on_comms_entry`:**")
|
|
|
|
|
p("")
|
|
|
|
|
code("src/app_controller.py:_on_comms_entry accesses (32 branch points):")
|
|
|
|
|
code(" _offload_entry_payload (1 access)")
|
|
|
|
|
code(" _pending_comms (1 access)")
|
|
|
|
|
code(" _pending_comms_lock (1 access)")
|
|
|
|
|
code(" _pending_history_adds (4 accesses)")
|
|
|
|
|
code(" _pending_history_adds_lock (4 accesses)")
|
|
|
|
|
code(" _token_history (1 access)")
|
|
|
|
|
p("")
|
|
|
|
|
p("All 6 access sites use defensive nil-checking (`if entry is None: ...` or `entry.get('key', default)`) before reach-through. This is the pattern that creates branch explosion.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Three fixes, ranked by ROI:**")
|
|
|
|
|
p("")
|
|
|
|
|
p("#### Fix 1: Nil Sentinel `[N]` (low effort, ~1 hour)")
|
|
|
|
|
p("")
|
|
|
|
|
code("NIL_METADATA = Metadata(")
|
|
|
|
|
code(" local_ts=0.0,")
|
|
|
|
|
code(" session_usage={},")
|
|
|
|
|
code(" _offload_entry_payload=None,")
|
|
|
|
|
code(" _pending_comms=(),")
|
|
|
|
|
code(" _pending_history_adds=(),")
|
|
|
|
|
code(" ...")
|
|
|
|
|
code(")")
|
|
|
|
|
p("")
|
|
|
|
|
p("Replace `if entry:` checks with `entry or NIL_METADATA`. Replace `entry.get('key', default)` with `getattr(entry, 'key', default)`. Net effect: 6 nil-check branches collapse to 1 sentinel-return path. Effective codepaths: 1.13e18 -> 1.13e18 (nil-checks contribute only 2^N each, but the bigger win is removing the defensive code path).")
|
|
|
|
|
p("")
|
|
|
|
|
p("#### Fix 2: Immediate-Mode Cache `[Q:key] -> [I:FetchCached] -> [T]` (medium effort, ~half day)")
|
|
|
|
|
p("")
|
|
|
|
|
code("class MetadataFieldCache:")
|
|
|
|
|
code(" def __init__(self):")
|
|
|
|
|
code(" self._cache: dict[tuple[str, str], Any] = {}")
|
|
|
|
|
code("")
|
|
|
|
|
code(" def get(self, metadata_id: str, field: str) -> Any:")
|
|
|
|
|
code(" key = (metadata_id, field)")
|
|
|
|
|
code(" if key not in self._cache:")
|
|
|
|
|
code(" self._cache[key] = self._fetch_from_metadata(metadata_id, field)")
|
|
|
|
|
code(" return self._cache[key]")
|
|
|
|
|
p("")
|
|
|
|
|
p("Consumers request `(metadata_id, 'field_name')`, get cached value. No string-key dict access on the Metadata itself. The 130 sites become 130 cache lookups (1 branch each, total 130 codepaths instead of 1.13e18).")
|
|
|
|
|
p("")
|
|
|
|
|
p("#### Fix 3: Generational Handle (medium effort, ~half day)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Wrap `Metadata` in `(index: u32, generation: u32)` resolved through a registry. Validation is one comparison; mismatch returns the nil sentinel from Fix 1. Net effect: 251 lifetime branches collapse to 1 lookup + 1 generation comparison. Effective codepaths: 1.13e18 -> 35.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Field-access matrix (Metadata):**")
|
|
|
|
|
p("")
|
|
|
|
|
p("| consumer | branch points | nil-check | field accesses |")
|
|
|
|
|
p("|---|---|---|---|")
|
|
|
|
|
p("| `_strip_stale_file_refreshes` | 12 | no | 0 |")
|
|
|
|
|
p("| `format_discussion` | 0 | no | 0 |")
|
|
|
|
|
p("| `_build_files_section_from_items` | 5 | **yes** | 0 |")
|
|
|
|
|
p("| `_append_comms` | 1 | **yes** | 0 |")
|
|
|
|
|
p("| `_trim_anthropic_history` | 13 | no | 0 |")
|
|
|
|
|
p("| `_save_config_to_disk` | 1 | no | 0 |")
|
|
|
|
|
p("| `_on_comms_entry` | 32 | no | 6 fields, 12 accesses |")
|
|
|
|
|
p("| `_execute_single_tool_call_async` | 15 | **yes** | 0 |")
|
|
|
|
|
p("| `_dashscope_call` | 5 | no | 0 |")
|
|
|
|
|
p("| `ollama_chat` | 3 | no | 0 |")
|
|
|
|
|
p("| `_pre_dispatch` | 8 | no | 0 |")
|
|
|
|
|
p("| `_strip_cache_controls` | 4 | no | 0 |")
|
|
|
|
|
p("| `_estimate_prompt_tokens` | 2 | no | 0 |")
|
|
|
|
|
p("| `_add_history_cache_breakpoint` | 5 | no | 0 |")
|
|
|
|
|
p("| `flat_config` | 2 | no | 0 |")
|
|
|
|
|
p("| `_offload_entry_payload` | 10 | no | 0 |")
|
|
|
|
|
p("| `_repair_minimax_history` | 10 | no | 1 (`append`) |")
|
|
|
|
|
p("| `_strip_private_keys` | 0 | no | 0 |")
|
|
|
|
|
p("| `_repair_deepseek_history` | 6 | no | 1 (`append`) |")
|
|
|
|
|
p("| `entry_to_str` | 3 | no | 0 |")
|
|
|
|
|
p("| `build_tier3_context` | 50 | no | 0 |")
|
|
|
|
|
p("| `_estimate_message_tokens` | 9 | **yes** | 1 (`_est_tokens`) |")
|
|
|
|
|
p("| `migrate_from_legacy_config` | 2 | no | 0 |")
|
|
|
|
|
p("| `run` | 1 | no | 0 |")
|
|
|
|
|
p("| `from_dict` | 0 | no | 0 |")
|
|
|
|
|
p("| `save_project` | 7 | **yes** | 0 |")
|
|
|
|
|
p("| `build_markdown_from_items` | 9 | no | 0 |")
|
|
|
|
|
p("| `_start_track_logic` | 1 | no | 2 fields (`_start_track_logic_result`, `ai_status`) |")
|
|
|
|
|
p("| `_refresh_api_metrics` | 11 | **yes** | 4 fields |")
|
|
|
|
|
p("| `_start_track_logic_result` | 10 | no | 7 fields, 12 accesses |")
|
|
|
|
|
p("| `_add_bleed_derived` | 0 | no | 0 |")
|
|
|
|
|
p("| `build_markdown_no_history` | 0 | no | 0 |")
|
|
|
|
|
p("| `_invalidate_token_estimate` | 0 | no | 0 |")
|
|
|
|
|
p("| `_repair_anthropic_history` | 6 | no | 1 (`append`) |")
|
|
|
|
|
p("| `_trim_minimax_history` | 8 | no | 0 |")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Producers of Metadata (77 functions across 6 files):**")
|
|
|
|
|
p("")
|
|
|
|
|
p("`src/api_hook_client.py` (33 producers):")
|
|
|
|
|
p("- `get_status`, `get_gui_state`, `apply_patch`, `post_project`, `get_project_switch_status`, `get_project`, `push_event`, `drag`, `select_tab`, `trigger_patch`, `get_mma_workers`, `get_performance`, `wait_for_project_switch`, `reject_patch`, `get_mma_status`, `get_gui_diagnostics`, `get_session`, `get_startup_timeline`, `select_list_item`, `post_session`, `get_context_state`, `get_warmup_status`, `right_click`, `get_system_telemetry`, `get_warmup_wait`, `get_node_status`, `get_gui_health`, `get_patch_status`, `get_io_pool_status`, `post_gui`, `get_financial_metrics`, `click`, `set_value`")
|
|
|
|
|
p("")
|
|
|
|
|
p("`src/app_controller.py` (26 producers):")
|
|
|
|
|
p("- `_api_get_mma_status`, `get_mma_status`, `get_session`, `status`, `_api_get_api_session`, `load_config`, `_api_get_api_project`, `_api_status`, `_api_get_gui_state`, `get_diagnostics`, `_api_get_session`, `wait`, `get_performance`, `get_session_insights`, `_api_get_diagnostics`, `get_gui_state`, `_api_generate`, `_offload_entry_payload`, `get_context`, `get_api_project`, `_api_get_performance`, `get_api_session`, `_api_token_stats`, `token_stats`, `generate`, `_api_get_context`")
|
|
|
|
|
p("")
|
|
|
|
|
p("`src/ai_client.py` (9 producers):")
|
|
|
|
|
p("- `get_gemini_cache_stats`, `_send_cli_round_result`, `_dashscope_call`, `_parse_tool_args_result`, `get_token_stats`, `_add_bleed_derived`, `_content_block_to_dict`, `ollama_chat`, `_load_credentials`")
|
|
|
|
|
p("")
|
|
|
|
|
p("`src/project_manager.py` (7 producers):")
|
|
|
|
|
p("- `load_history`, `default_discussion`, `load_project`, `default_project`, `flat_config`, `migrate_from_legacy_config`, `str_to_entry`")
|
|
|
|
|
p("")
|
|
|
|
|
p("`src/models.py` (2 producers):")
|
|
|
|
|
p("- `_load_config_from_disk`, `to_dict`")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Full struct shape (inferred from 130 field-access sites):**")
|
|
|
|
|
p("")
|
|
|
|
|
p("Hot fields (>=3 accesses):")
|
|
|
|
|
p("- `get`: 10 accesses (used as a method call - defensive nil-check pattern)")
|
|
|
|
|
p("- `pop`: 3 accesses")
|
|
|
|
|
p("- `append`: 3 accesses")
|
|
|
|
|
p("")
|
|
|
|
|
p("Used fields (1-2 accesses):")
|
|
|
|
|
p("- `session_usage`, `files`, `ai_status`, `local_ts`, `_offload_entry_payload`, `ui_auto_add_history`, `_pending_comms_lock`, `_pending_history_adds_lock`, `_token_history`, `_pending_comms`, `_pending_history_adds`, `items`, `_est_tokens`, `output`, `content`, `marker`, `discussion`, `_start_track_logic_result`, `latency`, `_recalculate_session_usage`, `_token_stats`, `_gemini_cache_text`, `vendor_quota`, `last_error`, `error`, `_update_cached_stats`, `usage`, `context_files`, `_pending_gui_tasks_lock`, `_topological_sort_tickets_result`, `active_project_root`, `event_queue`, `engines`, `project`, `active_discussion`, `submit_io`, `tracks`, `config`, `mma_tier_usage`, `_pending_gui_tasks`, `mma_step_mode`, `active_project_path`, `estimated_prompt_tokens`, `max_prompt_tokens`, `utilization_pct`, `headroom`, `would_trim`, `sys_tokens`, `tool_tokens`, `history_tokens`")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Cross-audit findings on Metadata:**")
|
|
|
|
|
p("")
|
|
|
|
|
p("| bucket | audit script | site count | example file | example line | note |")
|
|
|
|
|
p("|---|---|---|---|---|---|")
|
|
|
|
|
p("| optional_in_baseline | `audit_optional_in_3_files` | 76 | `src\\ai_client.py` | 159 | 76 sites |")
|
|
|
|
|
p("")
|
|
|
|
|
p("The cross-audit mapping found 76 `Optional[T]` violation sites in `src/ai_client.py` that map to the Metadata aggregate via file-level fallback (because the PCG doesn't track per-line locations for function-level matches). This is a real signal: the file that produces the most Metadata also has the most `Optional[T]` violations.")
|
|
|
|
|
|
|
|
|
|
h("Finding 2 (HIGH): FileItems aggregate has 104 effective codepaths + 1 nil-check", 2)
|
|
|
|
|
p("**Severity:** High. Smaller than Metadata but same shape problem.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Evidence:**")
|
|
|
|
|
p("- 3 consumers in `src/`")
|
|
|
|
|
p("- 14 branch points across those consumers")
|
|
|
|
|
p("- 1 nil-check function")
|
|
|
|
|
p("- 0 typed field-access sites")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Fix:** Same shape as Finding 1's Fix 1 (nil sentinel). Single-function impact; can be done in 30 minutes.")
|
|
|
|
|
|
|
|
|
|
h("Finding 3 (MEDIUM): HistoryMessage has 4 effective codepaths + 4 untyped sites", 2)
|
|
|
|
|
p("**Severity:** Medium. Small scope but same pattern.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Evidence:**")
|
|
|
|
|
p("- 2 consumers in `src/`")
|
|
|
|
|
p("- 2 branch points")
|
|
|
|
|
p("- 4 untyped field-access sites, 0% typed")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Fix:** Migrate to typed fields. The struct already has typed fields; consumers just need to stop using string-key access.")
|
|
|
|
|
|
|
|
|
|
h("Finding 4 (LOW): ToolCall has 1 effective codepath + 1 untyped site", 2)
|
|
|
|
|
p("**Severity:** Low. Single site, single consumer.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Evidence:** 1 consumer, 1 untyped access.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Fix:** Trivial. Change `entry['key']` to `entry.key`.")
|
|
|
|
|
|
|
|
|
|
h("Finding 5 (DATA-GAP): 6 of 10 real aggregates show 0 producers/0 consumers", 2)
|
|
|
|
|
p("**Severity:** Data gap, not a code defect. The PCG only detects function signatures with explicit type annotations. Aggregates whose consumers use untyped dict patterns are not captured.")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Affected:** `CommsLog`, `CommsLogEntry`, `FileItem`, `History`, `Result`, `ToolDefinition`")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Fix:** PCG needs P3 expansion (internal field-access tracking) to cover these. This is a follow-up track, not a code-path fix.")
|
|
|
|
|
|
|
|
|
|
h("4. Per-Aggregate Profiles (full detail inlined)", 1)
|
|
|
|
|
p("This section embeds the full per-aggregate audit output. Each aggregate has its 15-section profile (Header, Pipeline summary, Producers, Consumers, Field access matrix, Access pattern, SSDL sketch, Frequency, Result coverage, Type alias coverage, Cross-audit findings, Decomposition cost, Struct shape, Optimization candidates, Verdict, Evidence appendix) reproduced in full.")
|
|
|
|
|
|
|
|
|
|
p("### 4.1 Metadata (real, discussion-dim, needs restructuring)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/Metadata.md` (372 lines). Full DSL in `aggregates/Metadata.dsl` (178 lines). Full tree in `aggregates/Metadata.tree` (124 lines).")
|
|
|
|
|
|
|
|
|
|
for section_marker in ["## Pipeline summary", "## Producers (77)", "## Consumers (35)", "## Field access matrix", "## Access pattern", "## SSDL Sketch for `Metadata`", "## Frequency", "## Result coverage", "## Type alias coverage", "## Cross-audit findings", "## Decomposition cost", "## Struct shape (inferred from producer returns)", "## Optimization candidates", "## Verdict"]:
|
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
|
agg_text = read_agg("Metadata.md")
|
|
|
|
|
if agg_text:
|
|
|
|
|
# Skip the duplicate H1
|
|
|
|
|
parts = agg_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
inlined = "## Pipeline summary" + parts[1]
|
|
|
|
|
lines.append(inlined)
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.2 FileItems (real, curation-dim, needs restructuring)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/FileItems.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
fi_text = read_agg("FileItems.md")
|
|
|
|
|
if fi_text:
|
|
|
|
|
parts = fi_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.3 HistoryMessage (real, discussion-dim, needs restructuring)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/HistoryMessage.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
hm_text = read_agg("HistoryMessage.md")
|
|
|
|
|
if hm_text:
|
|
|
|
|
parts = hm_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.4 ToolCall (real, control-dim, needs restructuring)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/ToolCall.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
tc_text = read_agg("ToolCall.md")
|
|
|
|
|
if tc_text:
|
|
|
|
|
parts = tc_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.5 CommsLog (real, discussion-dim, needs restructuring - data gap)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/CommsLog.md`. Note: PCG found 0 producers/0 consumers because typed signatures are not used. The aggregate is real and used; the audit just can't measure it yet.")
|
|
|
|
|
p("")
|
|
|
|
|
cl_text = read_agg("CommsLog.md")
|
|
|
|
|
if cl_text:
|
|
|
|
|
parts = cl_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.6 CommsLogEntry (real, discussion-dim, needs restructuring - data gap)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/CommsLogEntry.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
cle_text = read_agg("CommsLogEntry.md")
|
|
|
|
|
if cle_text:
|
|
|
|
|
parts = cle_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.7 FileItem (real, curation-dim, needs restructuring - data gap)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/FileItem.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
fi2_text = read_agg("FileItem.md")
|
|
|
|
|
if fi2_text:
|
|
|
|
|
parts = fi2_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.8 History (real, discussion-dim, needs restructuring - data gap)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/History.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
hist_text = read_agg("History.md")
|
|
|
|
|
if hist_text:
|
|
|
|
|
parts = hist_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.9 Result (real, control-dim, needs restructuring - data gap)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/Result.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
res_text = read_agg("Result.md")
|
|
|
|
|
if res_text:
|
|
|
|
|
parts = res_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.10 ToolDefinition (real, control-dim, needs restructuring - data gap)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/ToolDefinition.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
td_text = read_agg("ToolDefinition.md")
|
|
|
|
|
if td_text:
|
|
|
|
|
parts = td_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.11 ChatMessage (candidate placeholder)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/ChatMessage.md`. ChatMessage would be detected after `any_type_componentization_20260621` merges.")
|
|
|
|
|
p("")
|
|
|
|
|
cm_text = read_agg("ChatMessage.md")
|
|
|
|
|
if cm_text:
|
|
|
|
|
parts = cm_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.12 ProviderHistory (candidate placeholder)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/ProviderHistory.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
ph_text = read_agg("ProviderHistory.md")
|
|
|
|
|
if ph_text:
|
|
|
|
|
parts = ph_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
p("### 4.13 ToolSpec (candidate placeholder)")
|
|
|
|
|
p("")
|
|
|
|
|
p("Full detail in `aggregates/ToolSpec.md`.")
|
|
|
|
|
p("")
|
|
|
|
|
ts_text = read_agg("ToolSpec.md")
|
|
|
|
|
if ts_text:
|
|
|
|
|
parts = ts_text.split("## Pipeline summary", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append("## Pipeline summary" + parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("5. SSDL Analysis Rollup", 1)
|
|
|
|
|
p("This section embeds the full SSDL rollup. The SSDL layer computes effective codepaths per aggregate, ranks them, and emits top-10 defusing recommendations.")
|
|
|
|
|
|
|
|
|
|
ssdl = read_md("ssdl_analysis.md")
|
|
|
|
|
if ssdl:
|
|
|
|
|
# Skip the duplicate H1
|
|
|
|
|
parts = ssdl.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("6. Organization Deductions (full)", 1)
|
|
|
|
|
p("This section embeds the full organization deductions. Per-aggregate verdict + file coupling + prioritized restructuring routes.")
|
|
|
|
|
|
|
|
|
|
org = read_md("organization_deductions.md")
|
|
|
|
|
if org:
|
|
|
|
|
parts = org.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("7. Call Graph (per-aggregate)", 1)
|
|
|
|
|
p("This section embeds the full call graph rollup. Producers and consumers grouped by file for each aggregate.")
|
|
|
|
|
|
|
|
|
|
cg = read_md("call_graph.md")
|
|
|
|
|
if cg:
|
|
|
|
|
parts = cg.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("8. Hot Paths (top consumers per aggregate)", 1)
|
|
|
|
|
p("This section embeds the hot-paths rollup. The top 5 consumers (by branch points) for each aggregate.")
|
|
|
|
|
|
|
|
|
|
hp = read_md("hot_paths.md")
|
|
|
|
|
if hp:
|
|
|
|
|
parts = hp.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("9. Field Usage (cross-aggregate)", 1)
|
|
|
|
|
p("This section embeds the field-usage rollup. Which fields are accessed how often across aggregates.")
|
|
|
|
|
|
|
|
|
|
fu = read_md("field_usage.md")
|
|
|
|
|
if fu:
|
|
|
|
|
parts = fu.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("10. Decomposition Matrix", 1)
|
|
|
|
|
p("This section embeds the decomposition matrix. Ranked refactor candidates with cost estimates.")
|
|
|
|
|
|
|
|
|
|
dm = read_md("decomposition_matrix.md")
|
|
|
|
|
if dm:
|
|
|
|
|
parts = dm.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("11. Cross-Audit Summary", 1)
|
|
|
|
|
p("This section embeds the cross-audit summary. Per-bucket counts per aggregate.")
|
|
|
|
|
|
|
|
|
|
cas = read_md("cross_audit_summary.md")
|
|
|
|
|
if cas:
|
|
|
|
|
parts = cas.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("12. Dead Fields", 1)
|
|
|
|
|
p("This section embeds the dead-fields rollup. Fields with low access counts.")
|
|
|
|
|
|
|
|
|
|
df = read_md("dead_fields.md")
|
|
|
|
|
if df:
|
|
|
|
|
parts = df.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("13. Candidate Aggregates", 1)
|
|
|
|
|
p("This section embeds the candidates rollup. The 3 placeholder aggregates (ToolSpec, ChatMessage, ProviderHistory).")
|
|
|
|
|
|
|
|
|
|
can = read_md("candidates.md")
|
|
|
|
|
if can:
|
|
|
|
|
parts = can.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("14. Top-Level Summary", 1)
|
|
|
|
|
p("This section embeds the top-level summary rollup.")
|
|
|
|
|
|
|
|
|
|
summ = read_md("summary.md")
|
|
|
|
|
if summ:
|
|
|
|
|
parts = summ.split("\n", 1)
|
|
|
|
|
if len(parts) == 2:
|
|
|
|
|
lines.append(parts[1])
|
|
|
|
|
lines.append("")
|
|
|
|
|
|
|
|
|
|
h("15. Restructuring Routes (Prioritized)", 1)
|
|
|
|
|
p("| Priority | Aggregate | Fix | Effort | Codepath reduction |")
|
|
|
|
|
p("|---|---|---|---|---|")
|
|
|
|
|
p("| 1 | Metadata | Nil Sentinel + Immediate-Mode Cache | ~half day | 1.13e18 -> 130 |")
|
|
|
|
|
p("| 2 | Metadata | Generational Handle | ~half day | 1.13e18 -> 35 |")
|
|
|
|
|
p("| 3 | FileItems | Nil Sentinel | ~30 min | 104 -> ~50 |")
|
|
|
|
|
p("| 4 | HistoryMessage | Typed field migration | ~1 hour | 4 -> 1 |")
|
|
|
|
|
p("| 5 | ToolCall | Typed field migration | ~5 min | 1 -> 1 |")
|
|
|
|
|
p("| 6 | (follow-up) | PCG P3 expansion for 6 data-gap aggregates | ~1 day | unlocks measurement |")
|
|
|
|
|
p("")
|
|
|
|
|
p("The two Metadata fixes (1 + 2) can be done in either order; Fix 1 is a prerequisite for Fix 2 (the sentinel is what the handle returns on mismatch).")
|
|
|
|
|
|
|
|
|
|
h("16. File Coupling (Where Restructuring Has Highest Ripple)", 1)
|
|
|
|
|
p("| File | Producers | Consumers | Role |")
|
|
|
|
|
p("|---|---|---|---|")
|
|
|
|
|
p("| `src/app_controller.py` | 1 | 1 | Hub: produces + consumes `Metadata` (dominant coupling) |")
|
|
|
|
|
p("| `src/ai_client.py` | 1 | 2 | Multi-aggregate; touches Metadata + CommsLogEntry + HistoryMessage |")
|
|
|
|
|
p("| `src/models.py` | 1 | 1 | Canonical source for `Metadata` + others |")
|
|
|
|
|
p("")
|
|
|
|
|
p("`src/app_controller.py` is the central nervous system. Restructuring `Metadata` ripples through every AI turn dispatch in the app.")
|
|
|
|
|
|
|
|
|
|
h("17. Verification", 1)
|
|
|
|
|
p("- **131 tests passing** (96 unit + 15 phase78 + 13 phase89 + 7 integration)")
|
|
|
|
|
p("- **Meta-audit clean** (0 violations on `audit_code_path_audit_coverage.py --strict`)")
|
|
|
|
|
p("- **All 13 aggregates have audit artifacts** in `aggregates/` (10 real + 3 candidate placeholders)")
|
|
|
|
|
p("")
|
|
|
|
|
p("### Audit gates")
|
|
|
|
|
p("")
|
|
|
|
|
p("| Gate | Status |")
|
|
|
|
|
p("|---|---|")
|
|
|
|
|
p("| `audit_exception_handling.py --strict` | PASS (informational) |")
|
|
|
|
|
p("| `audit_main_thread_imports.py` | PASS |")
|
|
|
|
|
p("| `audit_no_models_config_io.py` | PASS |")
|
|
|
|
|
p("| `audit_code_path_audit_coverage.py --strict` | PASS (0 violations) |")
|
|
|
|
|
p("| `audit_weak_types.py --strict` | REGRESSION (117 vs 112 baseline; from cherry-picked commits on master, not from this track) |")
|
|
|
|
|
p("| `audit_optional_in_3_files.py --strict` | REGRESSION (7 pre-existing `Optional[T]` violations in mcp_client + ai_client) |")
|
|
|
|
|
|
|
|
|
|
h("18. Reproducing This Audit", 1)
|
|
|
|
|
code("# Generate the 6 input JSONs")
|
|
|
|
|
code("uv run python scripts/audit_weak_types.py --json > tests/artifacts/audit_inputs/audit_weak_types.json")
|
|
|
|
|
code("uv run python scripts/audit_exception_handling.py --json > tests/artifacts/audit_inputs/audit_exception_handling.json")
|
|
|
|
|
code("uv run python scripts/audit_optional_in_3_files.py --json > tests/artifacts/audit_inputs/audit_optional_in_3_files.json")
|
|
|
|
|
code("uv run python scripts/audit_no_models_config_io.py --json > tests/artifacts/audit_inputs/audit_no_models_config_io.json")
|
|
|
|
|
code("uv run python scripts/audit_main_thread_imports.py --json > tests/artifacts/audit_inputs/audit_main_thread_imports.json")
|
|
|
|
|
code("uv run python scripts/generate_type_registry.py --json > tests/artifacts/audit_inputs/type_registry.json")
|
|
|
|
|
code("")
|
|
|
|
|
code("# Run the v2 audit")
|
|
|
|
|
code("uv run python -c \"")
|
|
|
|
|
code("from src.code_path_audit import run_audit, render_rollups")
|
|
|
|
|
code("from pathlib import Path")
|
|
|
|
|
code("result = run_audit(src_dir='src', audit_inputs_dir='tests/artifacts/audit_inputs', output_dir='docs/reports/code_path_audit', date='2026-06-22')")
|
|
|
|
|
code("render_rollups(result.data, Path('docs/reports/code_path_audit/2026-06-22'))")
|
|
|
|
|
code("\"")
|
|
|
|
|
code("")
|
|
|
|
|
code("# Run the meta-audit")
|
|
|
|
|
code("uv run python scripts/audit_code_path_audit_coverage.py --input-dir docs/reports/code_path_audit/2026-06-22/ --strict")
|
|
|
|
|
code("")
|
|
|
|
|
code("# Run the tests")
|
|
|
|
|
code("uv run pytest tests/test_code_path_audit.py tests/test_code_path_audit_phase78.py tests/test_code_path_audit_phase89.py tests/test_code_path_audit_integration.py")
|
|
|
|
|
|
|
|
|
|
h("19. See Also", 1)
|
|
|
|
|
p("**Per-aggregate detailed profiles (13 files, full evidence):**")
|
|
|
|
|
for agg_name in ["Metadata", "FileItems", "CommsLog", "CommsLogEntry", "FileItem", "History", "HistoryMessage", "Result", "ToolCall", "ToolDefinition", "ChatMessage", "ProviderHistory", "ToolSpec"]:
|
|
|
|
|
p(f"- `aggregates/{agg_name}.md` - 15-section detailed profile")
|
|
|
|
|
p(f"- `aggregates/{agg_name}.dsl` - flat-section DSL artifact")
|
|
|
|
|
p(f"- `aggregates/{agg_name}.tree` - ASCII tree artifact")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Top-level rollups (10 files):**")
|
|
|
|
|
p("- `summary.md` - 70-line top-level summary")
|
|
|
|
|
p("- `ssdl_analysis.md` - SSDL rollup with top-10 defusing recommendations")
|
|
|
|
|
p("- `organization_deductions.md` - per-aggregate verdict + file coupling + restructuring routes")
|
|
|
|
|
p("- `call_graph.md` - producer/consumer tables per aggregate")
|
|
|
|
|
p("- `decomposition_matrix.md` - ranked refactor candidates")
|
|
|
|
|
p("- `hot_paths.md` - top 5 hot consumers per aggregate")
|
|
|
|
|
p("- `field_usage.md` - cross-aggregate field frequency")
|
|
|
|
|
p("- `dead_fields.md` - fields with low access")
|
|
|
|
|
p("- `cross_audit_summary.md` - per-bucket cross-audit table")
|
|
|
|
|
p("- `candidates.md` - the 3 placeholder aggregates")
|
|
|
|
|
p("")
|
|
|
|
|
p("**Track artifacts:**")
|
|
|
|
|
p("- `TRACK_COMPLETION_code_path_audit_20260622.md` - the track completion report")
|
|
|
|
|
p("- `conductor/tracks/code_path_audit_20260607/spec_v2.md` - canonical spec")
|
|
|
|
|
p("- `conductor/tracks/code_path_audit_20260607/plan_v2.md` - canonical plan")
|
|
|
|
|
p("- `conductor/code_styleguides/code_path_audit.md` - 5-convention styleguide")
|
|
|
|
|
|
|
|
|
|
h("20. Commit history", 1)
|
|
|
|
|
code("713c0349 docs(reports): single coherent audit report (AUDIT_REPORT.md)")
|
|
|
|
|
code("628841d0 docs(reports): TRACK_COMPLETION revised with active SSDL deductions")
|
|
|
|
|
code("783e5fd9 feat(audit): SSDL analysis - effective codepaths + nil-sentinel + organization verdict")
|
|
|
|
|
code("00f9d498 docs(reports): pre-compaction report - all state needed to resume post-compaction")
|
|
|
|
|
code("09167986 wip: SSDL analysis (has indentation bug, needs fix)")
|
|
|
|
|
code("9113bc21 docs(reports): TRACK_COMPLETION revised - real-data analysis section")
|
|
|
|
|
code("558258cf feat(audit): rich rollups + per-line indentation fix - 2136 total lines")
|
|
|
|
|
code("59eeee81 feat(audit): enriched markdown renderer - 15 sections per profile + 2 new rollups")
|
|
|
|
|
|
|
|
|
|
output = "\n".join(lines)
|
|
|
|
|
out_path = OUT_DIR / "AUDIT_REPORT.md"
|
|
|
|
|
out_path.write_text(output, encoding="utf-8")
|
|
|
|
|
print(f"Wrote {out_path} ({len(lines)} lines)")
|