conductor(checkpoint): Phase 2: Infrastructure Verification complete
This commit is contained in:
@@ -4,13 +4,13 @@
|
|||||||
- [x] Task: Review `mma-orchestrator/SKILL.md` and `MMA_Support` docs for Tier 2/3/4 definitions. e9283f1
|
- [x] Task: Review `mma-orchestrator/SKILL.md` and `MMA_Support` docs for Tier 2/3/4 definitions. e9283f1
|
||||||
- [x] Task: Investigate "Centralized Skill" vs. "Role-Based Sub-Agents" architectures for hierarchical delegation. a8b7c2d
|
- [x] Task: Investigate "Centralized Skill" vs. "Role-Based Sub-Agents" architectures for hierarchical delegation. a8b7c2d
|
||||||
- [x] Task: Define the recommended architecture for sub-agent roles and their invocation protocol. f1a2b3c
|
- [x] Task: Define the recommended architecture for sub-agent roles and their invocation protocol. f1a2b3c
|
||||||
- [~] Task: Conductor - User Manual Verification 'Research and Investigation' (Protocol in workflow.md)
|
- [x] Task: Conductor - User Manual Verification 'Research and Investigation' (Protocol in workflow.md) a3cb12b
|
||||||
|
|
||||||
## Phase 2: Infrastructure Verification
|
## Phase 2: Infrastructure Verification
|
||||||
- [ ] Task: Write tests for `.\scripts
|
- [x] Task: Write tests for `.\scripts\run_subagent.ps1` to ensure it correctly spawns stateless agents and handles output. a3cb12b
|
||||||
un_subagent.ps1` to ensure it correctly spawns stateless agents and handles output.
|
- [x] Task: Verify `run_subagent.ps1` behavior for Tier 3 (coding) and Tier 4 (QA) use cases. a3cb12b
|
||||||
- [ ] Task: Verify `run_subagent.ps1` behavior for Tier 3 (coding) and Tier 4 (QA) use cases.
|
- [x] Task: Create a diagnostic test to verify Tier 2 -> Tier 3 delegation flow and context isolation. a3cb12b
|
||||||
- [ ] Task: Create a diagnostic test to verify Tier 2 -> Tier 3 delegation flow and context isolation.
|
- [~] Task: Conductor - User Manual Verification 'Infrastructure Verification' (Protocol in workflow.md)
|
||||||
|
|
||||||
## Phase 3: Test Track Implementation
|
## Phase 3: Test Track Implementation
|
||||||
- [ ] Task: Scaffold the `mma_verification_mock` test track directory and metadata.
|
- [ ] Task: Scaffold the `mma_verification_mock` test track directory and metadata.
|
||||||
|
|||||||
@@ -12,6 +12,10 @@ def run_ps_script(role, prompt):
|
|||||||
"-Prompt", prompt
|
"-Prompt", prompt
|
||||||
]
|
]
|
||||||
result = subprocess.run(cmd, capture_output=True, text=True)
|
result = subprocess.run(cmd, capture_output=True, text=True)
|
||||||
|
if result.stdout:
|
||||||
|
print(f"\n[Sub-Agent {role} Output]:\n{result.stdout}")
|
||||||
|
if result.stderr:
|
||||||
|
print(f"\n[Sub-Agent {role} Error]:\n{result.stderr}")
|
||||||
return result
|
return result
|
||||||
|
|
||||||
def test_subagent_script_qa_live():
|
def test_subagent_script_qa_live():
|
||||||
@@ -41,3 +45,13 @@ def test_subagent_script_utility_live():
|
|||||||
|
|
||||||
assert result.returncode == 0
|
assert result.returncode == 0
|
||||||
assert "true" in result.stdout.lower()
|
assert "true" in result.stdout.lower()
|
||||||
|
|
||||||
|
def test_subagent_isolation_live():
|
||||||
|
"""Verify that the sub-agent is stateless and does not see the parent's conversation context."""
|
||||||
|
# This prompt asks the sub-agent about a 'secret' mentioned only here, not in its prompt.
|
||||||
|
prompt = "What is the secret code I just told you? If I didn't tell you, say 'UNKNOWN'."
|
||||||
|
result = run_ps_script("Utility", prompt)
|
||||||
|
|
||||||
|
assert result.returncode == 0
|
||||||
|
# A stateless agent should not know any previous context.
|
||||||
|
assert "unknown" in result.stdout.lower()
|
||||||
Reference in New Issue
Block a user