From be689ad1e9542bd182a3ad8af2cc4cacb0fdafc6 Mon Sep 17 00:00:00 2001 From: Ed_ Date: Wed, 25 Feb 2026 20:52:45 -0500 Subject: [PATCH] chore(conductor): Checkpoint Phase 1: Research and Inventory for test curation track --- conductor/tracks.md | 2 +- .../test_curation_20260225/inventory.md | 70 +++++++++++++++++++ .../tracks/test_curation_20260225/plan.md | 8 +-- 3 files changed, 75 insertions(+), 5 deletions(-) create mode 100644 conductor/tracks/test_curation_20260225/inventory.md diff --git a/conductor/tracks.md b/conductor/tracks.md index eecbfef..67f4b98 100644 --- a/conductor/tracks.md +++ b/conductor/tracks.md @@ -45,7 +45,7 @@ This file tracks all major tracks for the project. Each track has its own detail --- -- [ ] **Track: Test Suite Curation and Organization** +- [~] **Track: Test Suite Curation and Organization** *Link: [./tracks/test_curation_20260225/](./tracks/test_curation_20260225/)* diff --git a/conductor/tracks/test_curation_20260225/inventory.md b/conductor/tracks/test_curation_20260225/inventory.md new file mode 100644 index 0000000..55e097e --- /dev/null +++ b/conductor/tracks/test_curation_20260225/inventory.md @@ -0,0 +1,70 @@ +# Test Suite Inventory - manual_slop + +## Categories + +### Manual Slop Core/GUI +- `tests/test_ai_context_history.py` +- `tests/test_api_events.py` +- `tests/test_gui_diagnostics.py` +- `tests/test_gui_events.py` +- `tests/test_gui_performance_requirements.py` +- `tests/test_gui_stress_performance.py` +- `tests/test_gui_updates.py` +- `tests/test_gui2_events.py` +- `tests/test_gui2_layout.py` +- `tests/test_gui2_mcp.py` +- `tests/test_gui2_parity.py` +- `tests/test_gui2_performance.py` +- `tests/test_headless_api.py` +- `tests/test_headless_dependencies.py` +- `tests/test_headless_startup.py` +- `tests/test_history_blacklist.py` +- `tests/test_history_bleed.py` (FAILING) +- `tests/test_history_migration.py` +- `tests/test_history_persistence.py` +- `tests/test_history_truncation.py` +- 
`tests/test_performance_monitor.py` +- `tests/test_token_usage.py` +- `tests/test_layout_reorganization.py` + +### Conductor/MMA (To be Blacklisted from core runs) +- `tests/test_mma_exec.py` +- `tests/test_mma_skeleton.py` +- `tests/test_conductor_api_hook_integration.py` +- `tests/conductor/test_infrastructure.py` +- `tests/test_gemini_cli_adapter.py` +- `tests/test_gemini_cli_integration.py` (FAILING) +- `tests/test_ai_client_cli.py` +- `tests/test_cli_tool_bridge.py` (FAILING) +- `tests/test_gemini_metrics.py` + +### MCP/Integrations +- `tests/test_api_hook_client.py` +- `tests/test_api_hook_extensions.py` +- `tests/test_hooks.py` +- `tests/test_sync_hooks.py` +- `tests/test_mcp_perf_tool.py` + +### Simulation/Workflows +- `tests/test_sim_ai_settings.py` +- `tests/test_sim_base.py` +- `tests/test_sim_context.py` +- `tests/test_sim_execution.py` +- `tests/test_sim_tools.py` +- `tests/test_workflow_sim.py` +- `tests/test_extended_sims.py` +- `tests/test_user_agent.py` +- `tests/test_live_workflow.py` +- `tests/test_agent_capabilities.py` +- `tests/test_agent_tools_wiring.py` + +## Redundancy Observations +- GUI tests are split between `gui` and `gui2`. Since `gui_2.py` is the current focus, legacy `gui` tests should be reviewed for relevance. +- History tests are highly fragmented (5+ files). +- Headless tests are fragmented (3 files). +- Simulation tests are fragmented (10+ files). + +## Failure Summary +- `tests/test_cli_tool_bridge.py`: `test_deny_decision` and `test_unreachable_hook_server` failing (wrong decision returned). +- `tests/test_gemini_cli_integration.py`: Integration with `gui_2.py` failing to find mock response in history. +- `tests/test_history_bleed.py`: `test_get_history_bleed_stats_basic` failing (assert 0 == 900000). 
diff --git a/conductor/tracks/test_curation_20260225/plan.md b/conductor/tracks/test_curation_20260225/plan.md index 51f8226..318bf79 100644 --- a/conductor/tracks/test_curation_20260225/plan.md +++ b/conductor/tracks/test_curation_20260225/plan.md @@ -3,10 +3,10 @@ This plan outlines the process for categorizing, organizing, and curating the existing test suite using a central manifest and exhaustive review. ## Phase 1: Research and Inventory -- [ ] Task: Initialize MMA Environment `activate_skill mma-orchestrator` -- [ ] Task: Inventory all existing tests in `tests/` and mapping them to categories -- [ ] Task: Identify failing and redundant tests through a full execution sweep -- [ ] Task: Conductor - User Manual Verification 'Phase 1: Research and Inventory' (Protocol in workflow.md) +- [x] Task: Initialize MMA Environment `activate_skill mma-orchestrator` +- [x] Task: Inventory all existing tests in `tests/` and map them to categories +- [x] Task: Identify failing and redundant tests through a full execution sweep +- [x] Task: Conductor - User Manual Verification 'Phase 1: Research and Inventory' (Protocol in workflow.md) ## Phase 2: Manifest and Tooling - [ ] Task: Design and create `tests.toml` manifest file