refactor(audit): remove dead DSL parser (DSL files no longer produced)

The v2 postfix DSL parser (DSL_WORD_ARITY_V2, _atom, to_dsl_v2, parse_dsl_v2) was implemented during the 14-phase DSL plan but never reached production: run_audit() (line ~1217 after this change) only writes .md files (AUDIT_REPORT.md plus per-aggregate markdowns via to_markdown/to_tree), never .dsl files. The DSL parser carried latent arity bugs (DSL_WORD_ARITY_V2 declared 5 for 'result-coverage' but writer emits 4; 4 for 'type-alias-coverage' but writer emits 3) which would have caused silent parse failures. Also removed the now-unused 'import re' statement (was only used by parse_dsl_v2). The 'from datetime import date as date_mod' is retained (still used at line ~1259, 1275, 1291 in the markdown renderer). Tests deleted in lockstep: - tests/test_code_path_audit_phase78.py: test_dsl_word_arity_v2_14_new_words - tests/test_code_path_audit_phase89.py: test_to_dsl_v2_includes_aggregate_kind_section, test_parse_dsl_v2_round_trip_aggregate_kind, test_parse_dsl_v2_malformed Verification: - grep -c 'to_dsl_v2|parse_dsl_v2|DSL_WORD_ARITY_V2' src/code_path_audit.py = 0 - 127 of 127 remaining tests pass (was 131; -4 tests deleted)
2026-06-24 09:57:17 -04:00
parent 59f48d1a0a
commit b385cd441b
3 changed files with 0 additions and 187 deletions
@@ -839,99 +839,8 @@ def run_all_cross_audit_reads(audit_inputs_dir: str) -> dict[str, dict]:
   out[audit_name] = {}
 return out

-DSL_WORD_ARITY_V2: dict[str, int] = {
- "kind": 1,
- "mem-dim": 1,
- "fn-ref": 4,
- "access-pattern": 1,
- "ap-evidence": 4,
- "frequency": 1,
- "freq-evidence": 4,
- "result-coverage": 5,
- "type-alias-coverage": 4,
- "cross-audit-finding": 5,
- "cross-audit-findings": 5,
- "decomp-cost": 8,
- "opt-candidate": 7,
- "is-candidate": 1,
-}
-
-import re
 from datetime import date as date_mod

-def _atom(s: str) -> str:
- """Format a string as a postfix DSL atom (bare or quoted)."""
- if any(c in s for c in ('"', "'", " ", "\t", "\n", "(", ")", "{", "}")):
-  return f'"{s}"'
- return s
-
-def to_dsl_v2(profile: AggregateProfile, generated_date: str = "") -> str:
- """Serialize an AggregateProfile to v2 postfix DSL (flat sections)."""
- lines: list[str] = []
- lines.append(f'\\ AggregateProfile: "{profile.name}"')
- lines.append(f"\\ generated {generated_date} by src.code_path_audit v2")
- lines.append("")
- lines.append("\\ === aggregate_kind ===")
- lines.append(f' "{profile.aggregate_kind}" kind')
- lines.append("")
- lines.append("\\ === memory_dim ===")
- lines.append(f' "{profile.memory_dim}" mem-dim')
- lines.append("")
- lines.append(f"\\ === producers ({len(profile.producers)} items) ===")
- for p in profile.producers:
-  lines.append(f' "{p.fqname}" "{p.file}" {p.line} "{p.role}" fn-ref')
- lines.append("")
- lines.append(f"\\ === consumers ({len(profile.consumers)} items) ===")
- for c in profile.consumers:
-  lines.append(f' "{c.fqname}" "{c.file}" {c.line} "{c.role}" fn-ref')
- lines.append("")
- lines.append("\\ === access_pattern ===")
- lines.append(f' "{profile.access_pattern}" access-pattern')
- lines.append("")
- lines.append(f"\\ === access_pattern_evidence ({len(profile.access_pattern_evidence)} items) ===")
- for ev in profile.access_pattern_evidence:
-  lines.append(f' "{ev.function.fqname}" "{ev.pattern}" {len(ev.field_accesses)} "{ev.confidence}" ap-evidence')
- lines.append("")
- lines.append("\\ === frequency ===")
- lines.append(f' "{profile.frequency}" frequency')
- lines.append("")
- lines.append(f"\\ === frequency_evidence ({len(profile.frequency_evidence)} items) ===")
- for ev in profile.frequency_evidence:
-  lines.append(f' "{ev.function.fqname}" "{ev.frequency}" "{ev.source}" "{ev.note}" freq-evidence')
- lines.append("")
- rc = profile.result_coverage
- lines.append("\\ === result_coverage ===")
- lines.append(f" {rc.total_producers} {rc.result_producers} {rc.total_consumers} {rc.result_consumers} result-coverage")
- lines.append("")
- tac = profile.type_alias_coverage
- lines.append("\\ === type_alias_coverage ===")
- lines.append(f" {tac.total_sites} {tac.typed_sites} {tac.untyped_sites} type-alias-coverage")
- lines.append("")
- lines.append("\\ === cross_audit_findings ===")
- for f in profile.cross_audit_findings.weak_types:
-  lines.append(f' "{f.audit_script}" {f.site_count} "{f.example_file}" {f.example_line} "{f.note}" cross-audit-finding')
- for f in profile.cross_audit_findings.exception_handling:
-  lines.append(f' "{f.audit_script}" {f.site_count} "{f.example_file}" {f.example_line} "{f.note}" cross-audit-finding')
- for f in profile.cross_audit_findings.optional_in_baseline:
-  lines.append(f' "{f.audit_script}" {f.site_count} "{f.example_file}" {f.example_line} "{f.note}" cross-audit-finding')
- for f in profile.cross_audit_findings.config_io_ownership:
-  lines.append(f' "{f.audit_script}" {f.site_count} "{f.example_file}" {f.example_line} "{f.note}" cross-audit-finding')
- for f in profile.cross_audit_findings.import_graph:
-  lines.append(f' "{f.audit_script}" {f.site_count} "{f.example_file}" {f.example_line} "{f.note}" cross-audit-finding')
- lines.append(" 5 cross-audit-findings")
- lines.append("")
- dc = profile.decomposition_cost
- lines.append("\\ === decomposition_cost ===")
- batch_size_str = str(dc.batch_size) if dc.batch_size is not None else "nil"
- lines.append(f" {dc.current_cost_estimate} {dc.componentize_savings} {dc.unify_savings} \"{dc.recommended_direction}\" \"{dc.recommended_rationale}\" {batch_size_str} {dc.struct_field_count} {str(dc.struct_frozen).lower()} decomp-cost")
- lines.append("")
- lines.append(f"\\ === optimization_candidates ({len(profile.optimization_candidates)} items) ===")
- for cand in profile.optimization_candidates:
-  lines.append(f' "{cand.candidate}" "{cand.direction}" {len(cand.affected_files)} {cand.estimated_savings_us} "{cand.effort}" "{cand.priority}" "{cand.cross_ref}" opt-candidate')
- lines.append("")
- lines.append("\\ === is_candidate ===")
- lines.append(f" {'true' if profile.is_candidate else 'false'} is-candidate")
- return "\n".join(lines)

 def to_markdown(profile: AggregateProfile) -> str:
 """Render the per-aggregate markdown (10 sections)."""
@@ -1028,63 +937,6 @@ def to_tree(profile: AggregateProfile) -> str:
 lines.append(f"|- optimization_candidates: [{len(profile.optimization_candidates)}]")
 return "\n".join(lines)

-def parse_dsl_v2(text: str) -> Result[dict]:
- """Parse a v2 postfix DSL into a nested dict (round-trip)."""
- tokens: list[str] = []
- for line in text.splitlines():
-  line = re.sub(r"\\.*", "", line)
-  if not line.strip():
-   continue
-  i = 0
-  while i < len(line):
-   c = line[i]
-   if c.isspace():
-    i += 1
-    continue
-   if c == '"':
-    j = line.find('"', i + 1)
-    if j == -1:
-     j = len(line)
-    tokens.append(line[i + 1 : j])
-    i = j + 1
-   else:
-    j = i
-    while j < len(line) and not line[j].isspace():
-     j += 1
-    tokens.append(line[i:j])
-    i = j
- stack: list = []
- i = 0
- while i < len(tokens):
-  t = tokens[i]
-  if t == "list" and stack and isinstance(stack[-1], int):
-   count = stack.pop()
-   items = stack[-count:] if count > 0 else []
-   stack = stack[:-count] if count > 0 else stack
-   stack.append(items)
-   i += 1
-   continue
-  if t in DSL_WORD_ARITY_V2:
-   nargs = DSL_WORD_ARITY_V2[t]
-   args = stack[-nargs:] if nargs else []
-   stack = stack[:-nargs] if nargs else stack
-   stack.append({"_tag": t, "_args": args})
-   i += 1
-   continue
-  if t in ("true", "false"):
-   stack.append(t == "true")
-  elif t == "nil":
-   stack.append(None)
-  elif t.lstrip("-").isdigit():
-   stack.append(int(t))
-  else:
-   stack.append(t)
-  i += 1
- if len(stack) != 1:
-  return Result(
-data={"_sections": stack},
- )
- return Result(data=stack[0])

 AGGREGATES_IN_SCOPE: tuple[str, ...] = (
 "Metadata",
@@ -67,7 +67,6 @@ from src.code_path_audit import (
 compute_type_alias_coverage,
 aggregate_cross_audit_findings,
 run_all_cross_audit_reads,
- DSL_WORD_ARITY_V2,
 )
 from src.result_types import Result, ErrorInfo, ErrorKind

@@ -206,17 +205,3 @@ def test_run_all_cross_audit_reads_partial() -> None:
  result = run_all_cross_audit_reads(tmp)
  assert "audit_weak_types" in result
  assert "audit_exception_handling" in result
-
-# Phase 8 Task 8.1 test
-def test_dsl_word_arity_v2_14_new_words() -> None:
- """DSL_WORD_ARITY_V2 has 14 new tagged words."""
- expected_words = {
-  "kind", "mem-dim", "fn-ref", "access-pattern", "ap-evidence",
-  "frequency", "freq-evidence", "result-coverage", "type-alias-coverage",
-  "cross-audit-finding", "cross-audit-findings", "decomp-cost",
-  "opt-candidate", "is-candidate",
- }
- assert expected_words.issubset(set(DSL_WORD_ARITY_V2.keys()))
- assert DSL_WORD_ARITY_V2["kind"] == 1
- assert DSL_WORD_ARITY_V2["fn-ref"] == 4
- assert DSL_WORD_ARITY_V2["decomp-cost"] == 8
@@ -21,10 +21,8 @@ from src.code_path_audit import (
 DecompositionCost,
 OptimizationCandidate,
 AggregateProfile,
- to_dsl_v2,
 to_markdown,
 to_tree,
- parse_dsl_v2,
 AGGREGATES_IN_SCOPE,
 CANDIDATE_AGGREGATES,
 synthesize_aggregate_profile,
@@ -56,14 +54,6 @@ def _make_profile(name: str = "Metadata", kind: str = "typealias") -> AggregateP
 )

 # Phase 8 Tasks 8.2-8.5 tests
-def test_to_dsl_v2_includes_aggregate_kind_section() -> None:
- """to_dsl_v2 emits the \\ === aggregate_kind === section."""
- profile = _make_profile()
- dsl = to_dsl_v2(profile, generated_date="2026-06-22")
- assert "\\ === aggregate_kind ===" in dsl
- assert '"typealias" kind' in dsl
- assert "\\ === memory_dim ===" in dsl
- assert '"discussion" mem-dim' in dsl

 def test_to_markdown_10_sections() -> None:
 """to_markdown emits the 10 sections per spec section 8.1."""
@@ -87,20 +77,6 @@ def test_to_tree_box_drawing() -> None:
 assert "Metadata" in tree
 assert "kind: typealias" in tree

-def test_parse_dsl_v2_round_trip_aggregate_kind() -> None:
- """parse_dsl_v2(to_dsl_v2(profile)) recovers the aggregate_kind section."""
- profile = _make_profile()
- dsl = to_dsl_v2(profile)
- parsed = parse_dsl_v2(dsl)
- assert isinstance(parsed, Result)
- assert "typealias" in str(parsed.data)
-
-def test_parse_dsl_v2_malformed() -> None:
- """parse_dsl_v2 returns Result.ok for empty input (no tagged words)."""
- result = parse_dsl_v2("\\ empty comment only\n")
- assert result.ok
- assert result.data == {"_sections": []}
-
 # Phase 9 Tasks 9.1-9.6 tests
 def test_aggregates_in_scope_10_real() -> None:
 """AGGREGATES_IN_SCOPE has 10 real aggregates."""