Private
Public Access
0
0

test(ai_client): add red tests for run_with_tool_loop shared helper

5 Red tests in tests/test_ai_client_tool_loop.py verify the planned
run_with_tool_loop contract (no-tool-call fast path, tool-call
dispatch, max-rounds safety, history append, error tolerance).

Deviation from plan: tests patch src.ai_client.send_openai_compatible
(plan's Task 1.1 had src.tool_loop.send_openai_compatible). The plan
predates the AGENTS.md HARD RULE on src/<thing>.py files; per the
follow-up track's Naming Convention section, run_with_tool_loop lives
IN src/ai_client.py. The function body imports send_openai_compatible
from src.openai_compatible, so src.ai_client.send_openai_compatible
is the correct patch path.

state.toml: current_phase 0 -> 1, phase_1 pending -> in_progress,
t1_1 pending -> in_progress, blocked_by status
phase_6_in_progress -> phase_6_complete (parent's Phase 6
checkpointed at 064cb26).

Confirmed red: 5 ImportError against src.ai_client.run_with_tool_loop
at collection time.
This commit is contained in:
2026-06-11 10:43:56 -04:00
parent a22d497591
commit dc0f25c53b
2 changed files with 114 additions and 4 deletions
@@ -5,15 +5,16 @@
track_id = "qwen_llama_grok_followup_20260611"
name = "Qwen/Llama/Grok Follow-Up (tool loop, PROVIDERS move, UX adaptations 2-9, local-first, matrix v2, Anthropic/Gemini/DeepSeek migration)"
status = "active"
current_phase = 0
current_phase = 1
last_updated = "2026-06-11"
[blocked_by]
# This follow-up is blocked on the parent track's Phase 6 (docs) completing.
qwen_llama_grok_integration_20260606 = "phase_6_in_progress"
# Resolved 2026-06-11 (parent Phase 6 checkpoint sha 064cb26).
qwen_llama_grok_integration_20260606 = "phase_6_complete"
[phases]
phase_1 = { status = "pending", checkpoint_sha = "", name = "Tool loop lift (run_with_tool_loop helper for 8 vendors)" }
phase_1 = { status = "in_progress", checkpoint_sha = "", name = "Tool loop lift (run_with_tool_loop helper for 8 vendors)" }
phase_2 = { status = "pending", checkpoint_sha = "", name = "PROVIDERS move (out of src/models.py)" }
phase_3 = { status = "pending", checkpoint_sha = "", name = "UX adaptations 2-9 (8 of 9 deferred from parent Phase 5)" }
phase_4 = { status = "pending", checkpoint_sha = "", name = "Local-first + matrix v2 expansion (12 new fields)" }
@@ -21,7 +22,7 @@ phase_5 = { status = "pending", checkpoint_sha = "", name = "Anthropic/Gemini/De
[tasks]
# Phase 1: Tool loop lift
t1_1 = { status = "pending", commit_sha = "", description = "Read tool-loop patterns in _send_minimax + the 4 inline-loop vendors" }
t1_1 = { status = "in_progress", commit_sha = "", description = "Read tool-loop patterns in _send_minimax + the 4 inline-loop vendors" }
t1_2 = { status = "pending", commit_sha = "", description = "Design run_with_tool_loop helper signature" }
t1_3 = { status = "pending", commit_sha = "", description = "Red: 5 tests for run_with_tool_loop in tests/test_tool_loop.py" }
t1_4 = { status = "pending", commit_sha = "", description = "Green: implement run_with_tool_loop in src/ai_client.py" }
+109
View File
@@ -0,0 +1,109 @@
"""Tests for src.ai_client.run_with_tool_loop (shared tool-loop helper).
5 Red tests. They verify:
1. No-tool-call path: returns immediately after one send.
2. Tool-call dispatch: dispatches via _execute_tool_calls_concurrently and
continues the loop.
3. Max-rounds safety: bails out after MAX_TOOL_ROUNDS + 2 iterations.
4. History append: appends an assistant message to the caller's history.
5. Error tolerance: continues even if a tool errors.
The helper lives in src.ai_client (per the AGENTS.md HARD RULE: no new
src/<thing>.py files). The tests patch src.ai_client.send_openai_compatible
because that's the symbol the function uses internally.
"""
from __future__ import annotations
from typing import Any
from unittest.mock import MagicMock, patch
import pytest
from src.openai_compatible import NormalizedResponse, OpenAICompatibleRequest
from src.ai_client import run_with_tool_loop
from src.vendor_capabilities import VendorCapabilities
@pytest.fixture
def caps() -> VendorCapabilities:
return VendorCapabilities(vendor="test", model="test-model", tool_calling=True, context_window=8192)
def _make_normalized_response(text: str = "ok", tool_calls: list[dict[str, Any]] | None = None) -> NormalizedResponse:
return NormalizedResponse(
text=text, tool_calls=tool_calls or [],
usage_input_tokens=10, usage_output_tokens=5,
usage_cache_read_tokens=0, usage_cache_creation_tokens=0,
raw_response=None,
)
def test_run_with_tool_loop_no_tool_calls_returns_immediately(caps: VendorCapabilities) -> None:
client = MagicMock()
with patch("src.ai_client.send_openai_compatible", return_value=_make_normalized_response("hello")) as call:
result = run_with_tool_loop(
client, OpenAICompatibleRequest(messages=[{"role": "user", "content": "x"}], model="m"),
capabilities=caps,
pre_tool_callback=None, qa_callback=None, patch_callback=None,
base_dir=".", vendor_name="test", history_lock=None, history=None,
)
assert result == "hello"
assert call.call_count == 1
def test_run_with_tool_loop_dispatches_tool_calls(caps: VendorCapabilities) -> None:
client = MagicMock()
tool_response = _make_normalized_response(
"first response", tool_calls=[{"id": "c1", "type": "function", "function": {"name": "read_file", "arguments": "{}"}}]
)
final_response = _make_normalized_response("after tool")
with patch("src.ai_client.send_openai_compatible", side_effect=[tool_response, final_response]) as call, \
patch("src.ai_client._execute_tool_calls_concurrently", return_value=[("read_file", "c1", "result", "")]) as dispatch:
result = run_with_tool_loop(
client, OpenAICompatibleRequest(messages=[{"role": "user", "content": "x"}], model="m"),
capabilities=caps,
pre_tool_callback=None, qa_callback=None, patch_callback=None,
base_dir=".", vendor_name="test", history_lock=None, history=None,
)
assert result == "after tool"
assert call.call_count == 2
assert dispatch.call_count == 1
def test_run_with_tool_loop_respects_max_rounds(caps: VendorCapabilities) -> None:
client = MagicMock()
infinite_tool_response = _make_normalized_response(
"loop", tool_calls=[{"id": "c1", "type": "function", "function": {"name": "noop", "arguments": "{}"}}]
)
with patch("src.ai_client.send_openai_compatible", return_value=infinite_tool_response), \
patch("src.ai_client._execute_tool_calls_concurrently", return_value=[("noop", "c1", "result", "")]):
result = run_with_tool_loop(
client, OpenAICompatibleRequest(messages=[{"role": "user", "content": "x"}], model="m"),
capabilities=caps,
pre_tool_callback=None, qa_callback=None, patch_callback=None,
base_dir=".", vendor_name="test", history_lock=None, history=None,
)
assert result == "loop"
def test_run_with_tool_loop_appends_to_history(caps: VendorCapabilities) -> None:
client = MagicMock()
history: list[dict[str, Any]] = []
history_lock = MagicMock()
history_lock.__enter__ = MagicMock(return_value=history_lock)
history_lock.__exit__ = MagicMock(return_value=False)
with patch("src.ai_client.send_openai_compatible", return_value=_make_normalized_response("hi")):
run_with_tool_loop(
client, OpenAICompatibleRequest(messages=[{"role": "user", "content": "x"}], model="m"),
capabilities=caps,
pre_tool_callback=None, qa_callback=None, patch_callback=None,
base_dir=".", vendor_name="test", history_lock=history_lock, history=history,
)
assert any(msg.get("role") == "assistant" and msg.get("content") == "hi" for msg in history)
def test_run_with_tool_loop_does_not_crash_on_tool_error(caps: VendorCapabilities) -> None:
client = MagicMock()
tool_response = _make_normalized_response(
"err", tool_calls=[{"id": "c1", "type": "function", "function": {"name": "fail", "arguments": "{}"}}]
)
final_response = _make_normalized_response("recovered")
with patch("src.ai_client.send_openai_compatible", side_effect=[tool_response, final_response]), \
patch("src.ai_client._execute_tool_calls_concurrently", return_value=[("fail", "c1", "", "ToolExecutionError")]):
result = run_with_tool_loop(
client, OpenAICompatibleRequest(messages=[{"role": "user", "content": "x"}], model="m"),
capabilities=caps,
pre_tool_callback=None, qa_callback=None, patch_callback=None,
base_dir=".", vendor_name="test", history_lock=None, history=None,
)
assert result == "recovered"