test(audit): fix critical test suite deadlocks and write exhaustive architectural report

- Fix 'Triple Bingo' history synchronization explosion during streaming - Implement stateless event buffering in ApiHookClient to prevent dropped events - Ensure 'tool_execution' events emit consistently across all LLM providers - Add hard timeouts to all background thread wait() conditions - Add thorough teardown cleanup to conftest.py's reset_ai_client fixture - Write highly detailed report_gemini.md exposing asyncio lifecycle flaws
2026-03-05 01:42:47 -05:00
parent bfdbd43785
commit 35480a26dc
15 changed files with 715 additions and 481 deletions
@@ -52,7 +52,6 @@ def test_tools_sim_live(live_gui: Any) -> None:
 sim.run() # Ensure history is updated via the async queue
 time.sleep(2)
 sim.teardown()
-
@pytest.mark.integration
 def test_execution_sim_live(live_gui: Any) -> None:
 """Run the Execution & Modals simulation against a live GUI."""
@@ -60,7 +59,11 @@ def test_execution_sim_live(live_gui: Any) -> None:
 assert client.wait_for_server(timeout=10)
 sim = ExecutionSimulation(client)
 sim.setup("LiveExecutionSim")
+ # Enable manual approval to test modals
+ client.set_value('manual_approve', True)
 client.set_value('current_provider', 'gemini_cli')
 client.set_value('gcli_path', f'"{sys.executable}" "{os.path.abspath("tests/mock_gemini_cli.py")}"')
 sim.run()
+ time.sleep(2)
 sim.teardown()
+