manual_slop/tests/test_ai_client_tool_loop_builder.py

"""Verify run_with_tool_loop supports a per-round request_builder callback.

Vendors that mutate their history list (e.g. MiniMax) need to rebuild
the messages on each round so the API sees the latest tool results.
run_with_tool_loop accepts a callable as the 2nd arg to enable this.
"""
from __future__ import annotations
from typing import Any
from unittest.mock import MagicMock, patch
from src.openai_compatible import NormalizedResponse, OpenAICompatibleRequest
from src.ai_client import run_with_tool_loop
from src.result_types import Result
from src.vendor_capabilities import VendorCapabilities

def _make_normalized_response(text: str = "ok", tool_calls: list[dict[str, Any]] | None = None) -> NormalizedResponse:
 from src.openai_schemas import UsageStats
 return NormalizedResponse(
  text=text, tool_calls=tool_calls or (),
  usage=UsageStats(input_tokens=10, output_tokens=5),
  raw_response=None,
 )

def test_run_with_tool_loop_calls_request_builder_each_round() -> None:
 caps = VendorCapabilities(vendor="test", model="test-model", tool_calling=True, context_window=8192)
 client = MagicMock()
 tool_response = _make_normalized_response(
  "first", tool_calls=[{"id": "c1", "type": "function", "function": {"name": "noop", "arguments": "{}"}}]
 )
 final = _make_normalized_response("done")
 builder_calls: list[int] = []
 def builder(round_idx: int) -> OpenAICompatibleRequest:
  builder_calls.append(round_idx)
  return OpenAICompatibleRequest(messages=[{"role": "user", "content": f"round={round_idx}"}], model="m")
 with patch("src.openai_compatible.send_openai_compatible", side_effect=[Result(data=tool_response), Result(data=final)]), \
      patch("src.ai_client._execute_tool_calls_concurrently", return_value=[("noop", "c1", "r", "")]):
  result = run_with_tool_loop(
   client, builder, capabilities=caps,
   pre_tool_callback=None, qa_callback=None, patch_callback=None,
   base_dir=".", vendor_name="test", history_lock=None, history=None,
  )
  assert result == "done"
  assert len(builder_calls) >= 2