Updated folder structure (for Docker)
This commit is contained in:
@@ -1,283 +0,0 @@
|
||||
"""Tests for the Agent."""
|
||||
|
||||
from unittest.mock import Mock
|
||||
|
||||
from agent.agent import Agent
|
||||
from infrastructure.persistence import get_memory
|
||||
|
||||
|
||||
class TestAgentInit:
    """Checks on the state of a freshly constructed ``Agent``.

    The ``memory`` and ``mock_llm`` arguments are pytest fixtures supplied
    from outside this file (presumably a conftest -- confirm there).
    """

    def test_init(self, memory, mock_llm):
        """Agent keeps the given LLM and exposes its default collaborators."""
        built = Agent(llm=mock_llm)

        assert built.llm is mock_llm
        assert built.tools is not None
        assert built.prompt_builder is not None
        # Default iteration cap when none is passed to the constructor.
        assert built.max_tool_iterations == 5

    def test_init_custom_iterations(self, memory, mock_llm):
        """An explicit ``max_tool_iterations`` is stored on the agent."""
        built = Agent(llm=mock_llm, max_tool_iterations=10)

        assert built.max_tool_iterations == 10

    def test_tools_registered(self, memory, mock_llm):
        """Every expected tool name is present in ``agent.tools``."""
        built = Agent(llm=mock_llm)

        required_names = (
            "set_path_for_folder",
            "list_folder",
            "find_media_imdb_id",
            "find_torrent",
            "add_torrent_by_index",
            "add_torrent_to_qbittorrent",
            "get_torrent_by_index",
            "set_language",
        )

        # One assert per name so a failure points at the missing tool.
        for required in required_names:
            assert required in built.tools
|
||||
|
||||
|
||||
class TestExecuteToolCall:
    """Exercises ``Agent._execute_tool_call`` with hand-built tool calls.

    Fixture arguments (``memory``, ``mock_llm``, ``real_folder``) come from
    outside this file (presumably a conftest -- confirm there).
    """

    @staticmethod
    def _tool_call(name, arguments):
        """Build a tool-call payload using the fixed id shared by these tests.

        ``arguments`` is the raw string placed under
        ``function.arguments``; it is passed through untouched.
        """
        return {
            "id": "call_123",
            "function": {"name": name, "arguments": arguments},
        }

    def test_execute_known_tool(self, memory, mock_llm, real_folder):
        """A registered tool called with valid arguments reports ``ok``."""
        agent = Agent(llm=mock_llm)
        downloads_path = str(real_folder["downloads"])
        memory.ltm.set_config("download_folder", downloads_path)

        outcome = agent._execute_tool_call(
            self._tool_call("list_folder", '{"folder_type": "download"}')
        )

        assert outcome["status"] == "ok"

    def test_execute_unknown_tool(self, memory, mock_llm):
        """An unregistered tool name yields an ``unknown_tool`` error."""
        agent = Agent(llm=mock_llm)

        outcome = agent._execute_tool_call(self._tool_call("unknown_tool", "{}"))

        assert outcome["error"] == "unknown_tool"
        # The error payload also carries the list of usable tools.
        assert "available_tools" in outcome

    def test_execute_with_bad_args(self, memory, mock_llm):
        """Calling a tool with an empty argument object yields ``bad_args``."""
        agent = Agent(llm=mock_llm)

        outcome = agent._execute_tool_call(
            self._tool_call("set_path_for_folder", "{}")
        )

        assert outcome["error"] == "bad_args"

    def test_execute_tracks_errors(self, memory, mock_llm):
        """A failing tool call leaves an entry in episodic ``recent_errors``."""
        agent = Agent(llm=mock_llm)

        # A numeric ``folder_name`` is the wrong type; the call is expected
        # to fail so that an error gets recorded. The result is not inspected.
        agent._execute_tool_call(
            self._tool_call("set_path_for_folder", '{"folder_name": 123}')
        )

        recorded = get_memory().episodic.recent_errors
        assert len(recorded) > 0

    def test_execute_with_invalid_json(self, memory, mock_llm):
        """Unparseable JSON in the arguments string yields ``bad_args``."""
        agent = Agent(llm=mock_llm)

        outcome = agent._execute_tool_call(
            self._tool_call("list_folder", "{invalid json}")
        )

        assert outcome["error"] == "bad_args"
|
||||
|
||||
|
||||
class TestStep:
    """Exercises ``Agent.step`` against mocked LLM responses.

    All fixture arguments are supplied from outside this file (presumably a
    conftest -- confirm there).
    """

    def test_step_text_response(self, memory, mock_llm):
        """Without a tool call, ``step`` returns the LLM's text."""
        agent = Agent(llm=mock_llm)

        # Expected text is whatever the ``mock_llm`` fixture is set up to
        # answer with (defined outside this file).
        assert agent.step("Hello") == "I found what you're looking for!"

    def test_step_saves_to_history(self, memory, mock_llm):
        """One step appends a user turn and an assistant turn to STM."""
        agent = Agent(llm=mock_llm)

        agent.step("Hi there")

        turns = get_memory().stm.get_recent_history(10)
        assert len(turns) == 2

        user_turn, assistant_turn = turns
        assert user_turn["role"] == "user"
        assert user_turn["content"] == "Hi there"
        assert assistant_turn["role"] == "assistant"

    def test_step_with_tool_call(self, memory, mock_llm_with_tool_call, real_folder):
        """A tool-call response is executed and the LLM is queried again."""
        memory.ltm.set_config("download_folder", str(real_folder["downloads"]))
        llm = mock_llm_with_tool_call

        agent = Agent(llm=llm)

        reply = agent.step("List my downloads").lower()

        assert any(keyword in reply for keyword in ("found", "torrent"))
        # One call that requests the tool, one call after the tool result.
        assert llm.complete.call_count == 2

        # CRITICAL: Verify tools were passed to LLM
        # Index 1 of a recorded call is its keyword-argument dict.
        first_call_kwargs = llm.complete.call_args_list[0][1]
        assert first_call_kwargs["tools"] is not None, "Tools not passed to LLM!"
        assert len(first_call_kwargs["tools"]) > 0, "Tools list is empty!"

    def test_step_max_iterations(self, memory, mock_llm):
        """``step`` stops asking for tools once the iteration cap is hit."""
        iteration_cap = 3
        calls_seen = 0

        def fake_complete(messages, tools=None):
            nonlocal calls_seen
            calls_seen += 1

            # Past the cap: answer with plain text so the loop can end.
            if calls_seen > iteration_cap:
                return {"role": "assistant", "content": "I couldn't complete the task."}

            # CRITICAL: Verify tools are passed (except on forced final call)
            assert tools is not None, f"Tools not passed on call {calls_seen}!"

            # Keep requesting a tool on every call up to the cap.
            return {
                "role": "assistant",
                "content": None,
                "tool_calls": [
                    {
                        "id": f"call_{calls_seen}",
                        "function": {
                            "name": "list_folder",
                            "arguments": '{"folder_type": "download"}',
                        },
                    }
                ],
            }

        mock_llm.complete = Mock(side_effect=fake_complete)
        agent = Agent(llm=mock_llm, max_tool_iterations=iteration_cap)

        agent.step("Do something")

        # Three tool-requesting calls plus one final call.
        assert calls_seen == iteration_cap + 1

    def test_step_includes_history(self, memory_with_history, mock_llm):
        """Prior conversation content shows up in the messages sent to the LLM."""
        agent = Agent(llm=mock_llm)

        agent.step("New message")

        # First positional argument of the most recent ``complete`` call.
        sent_messages = mock_llm.complete.call_args[0][0]
        # "Hello" is expected to come from the ``memory_with_history``
        # fixture (defined outside this file).
        assert any(
            "Hello" in str(message.get("content", "")) for message in sent_messages
        )

    def test_step_includes_events(self, memory, mock_llm):
        """A pending background event is mentioned in the messages sent."""
        memory.episodic.add_background_event("download_complete", {"name": "Movie.mkv"})
        agent = Agent(llm=mock_llm)

        agent.step("What's new?")

        sent_messages = mock_llm.complete.call_args[0][0]
        assert any(
            "download" in str(message.get("content", "")).lower()
            for message in sent_messages
        )

    def test_step_saves_ltm(self, memory, mock_llm, temp_dir):
        """After a step, ``ltm.json`` exists under the temp directory."""
        agent = Agent(llm=mock_llm)

        agent.step("Hello")

        assert (temp_dir / "ltm.json").exists()
|
||||
|
||||
|
||||
class TestAgentIntegration:
    """End-to-end style checks of ``Agent.step`` across several LLM turns."""

    def test_multiple_tool_calls(self, memory, mock_llm, real_folder):
        """Two consecutive tool requests are served before the final answer."""
        for config_key, folder_key in (
            ("download_folder", "downloads"),
            ("movie_folder", "movies"),
        ):
            memory.ltm.set_config(config_key, str(real_folder[folder_key]))

        calls_seen = 0

        def list_folder_request(call_id, raw_arguments):
            # Assistant message asking for a single ``list_folder`` tool call.
            return {
                "role": "assistant",
                "content": None,
                "tool_calls": [
                    {
                        "id": call_id,
                        "function": {
                            "name": "list_folder",
                            "arguments": raw_arguments,
                        },
                    }
                ],
            }

        def fake_complete(messages, tools=None):
            nonlocal calls_seen
            calls_seen += 1

            # CRITICAL: Verify tools are passed on every call
            assert tools is not None, f"Tools not passed on call {calls_seen}!"

            if calls_seen == 1:
                return list_folder_request("call_1", '{"folder_type": "download"}')

            if calls_seen == 2:
                # CRITICAL: Verify tool result was sent back
                assert any(
                    message.get("role") == "tool" for message in messages
                ), "Tool result not sent back to LLM!"
                return list_folder_request("call_2", '{"folder_type": "movie"}')

            # Third call onward: plain text ends the tool loop.
            return {
                "role": "assistant",
                "content": "I listed both folders for you.",
            }

        mock_llm.complete = Mock(side_effect=fake_complete)
        agent = Agent(llm=mock_llm)

        agent.step("List my downloads and movies")

        # Two tool-requesting turns plus the final text turn.
        assert calls_seen == 3
|
||||
Reference in New Issue
Block a user