mirror of
https://github.com/pewdiepie-archdaemon/odysseus.git
synced 2026-06-16 01:35:36 -04:00
148 lines
4.7 KiB
Python
148 lines
4.7 KiB
Python
import pytest
|
|
|
|
from services.memory import skill_extractor
|
|
|
|
|
|
class _FakeSession:
|
|
session_id = "s1"
|
|
|
|
def get_context_messages(self):
|
|
return [
|
|
{"role": "user", "content": "Walk me through deploying the service"},
|
|
{"role": "assistant", "content": "Sure, here's the runbook..."},
|
|
]
|
|
|
|
|
|
class _FakeSkillsManager:
|
|
def __init__(self):
|
|
self.added = []
|
|
|
|
def load(self, owner=None):
|
|
return []
|
|
|
|
def add_skill(self, **kwargs):
|
|
self.added.append(kwargs)
|
|
return {"id": "skill-1", **kwargs}
|
|
|
|
|
|
# Stray '{' in prose ("uses {a} then ...") before the real JSON object —
|
|
# the bug this fix addresses: slicing from the FIRST '{' to the LAST '}'
|
|
# produced invalid JSON and the whole extraction was silently dropped.
|
|
_STRAY_BRACE_RESPONSE = (
|
|
'Sure thing — note this uses {a} as a placeholder, then the actual skill is:\n'
|
|
'{"title": "Deploy runbook", "problem": "manual deploys are error-prone", '
|
|
'"solution": "use the deploy script", "steps": ["build", "push", "restart"], '
|
|
'"tags": ["deploy"], "confidence": 0.9}'
|
|
)
|
|
|
|
|
|
@pytest.mark.parametrize("response", [_STRAY_BRACE_RESPONSE])
|
|
async def test_maybe_extract_skill_recovers_json_past_stray_braces(monkeypatch, response):
|
|
async def fake_llm_call_async(*args, **kwargs):
|
|
return response
|
|
|
|
monkeypatch.setattr("src.llm_core.llm_call_async", fake_llm_call_async)
|
|
|
|
skills_manager = _FakeSkillsManager()
|
|
entry = await skill_extractor.maybe_extract_skill(
|
|
_FakeSession(),
|
|
skills_manager,
|
|
endpoint_url="http://endpoint",
|
|
model="test-model",
|
|
headers={},
|
|
round_count=3,
|
|
tool_count=3,
|
|
owner="alice",
|
|
)
|
|
|
|
assert entry is not None
|
|
assert entry["title"] == "Deploy runbook"
|
|
assert skills_manager.added and skills_manager.added[0]["title"] == "Deploy runbook"
|
|
|
|
|
|
# Response *starts* with a brace, but it's an invalid fragment — the valid
|
|
# skill JSON only appears on a later line. `json.loads(text)` fails on the
|
|
# first attempt even though `text[0] == "{"`, so the candidate walk must run
|
|
# regardless of whether the response starts with '{'.
|
|
_LEADING_INVALID_BRACE_RESPONSE = (
|
|
'{not json}\n'
|
|
'{"title": "Valid later", "problem": "p", "solution": "s", '
|
|
'"steps": ["one", "two", "three"], "tags": ["test"], "confidence": 0.9}'
|
|
)
|
|
|
|
|
|
@pytest.mark.parametrize("response", [_LEADING_INVALID_BRACE_RESPONSE])
|
|
async def test_maybe_extract_skill_recovers_json_after_leading_invalid_brace(monkeypatch, response):
|
|
async def fake_llm_call_async(*args, **kwargs):
|
|
return response
|
|
|
|
monkeypatch.setattr("src.llm_core.llm_call_async", fake_llm_call_async)
|
|
|
|
skills_manager = _FakeSkillsManager()
|
|
entry = await skill_extractor.maybe_extract_skill(
|
|
_FakeSession(),
|
|
skills_manager,
|
|
endpoint_url="http://endpoint",
|
|
model="test-model",
|
|
headers={},
|
|
round_count=3,
|
|
tool_count=3,
|
|
owner="alice",
|
|
)
|
|
|
|
assert entry is not None
|
|
assert entry["title"] == "Valid later"
|
|
assert skills_manager.added and skills_manager.added[0]["title"] == "Valid later"
|
|
|
|
|
|
async def test_maybe_extract_skill_drops_when_no_candidate_parses(monkeypatch):
|
|
async def fake_llm_call_async(*args, **kwargs):
|
|
return 'Some commentary with {unbalanced and { nested } braces } but no real JSON object'
|
|
|
|
monkeypatch.setattr("src.llm_core.llm_call_async", fake_llm_call_async)
|
|
|
|
skills_manager = _FakeSkillsManager()
|
|
entry = await skill_extractor.maybe_extract_skill(
|
|
_FakeSession(),
|
|
skills_manager,
|
|
endpoint_url="http://endpoint",
|
|
model="test-model",
|
|
headers={},
|
|
round_count=3,
|
|
tool_count=3,
|
|
owner="alice",
|
|
)
|
|
|
|
assert entry is None
|
|
assert not skills_manager.added
|
|
|
|
|
|
async def test_maybe_extract_skill_drops_on_multiple_json_objects(monkeypatch):
|
|
# Two valid JSON objects should be rejected by maybe_extract_skill.
|
|
resp = (
|
|
'{"title": "Deploy runbook", "problem": "manual", "solution": "script", '
|
|
'"steps": ["build"], "tags": ["deploy"], "confidence": 0.9}\n'
|
|
'{"title": "Unrelated skill", "problem": "manual", "solution": "script", '
|
|
'"steps": ["build"], "tags": ["deploy"], "confidence": 0.9}'
|
|
)
|
|
async def fake_llm_call_async(*args, **kwargs):
|
|
return resp
|
|
|
|
monkeypatch.setattr("src.llm_core.llm_call_async", fake_llm_call_async)
|
|
|
|
skills_manager = _FakeSkillsManager()
|
|
entry = await skill_extractor.maybe_extract_skill(
|
|
_FakeSession(),
|
|
skills_manager,
|
|
endpoint_url="http://endpoint",
|
|
model="test-model",
|
|
headers={},
|
|
round_count=3,
|
|
tool_count=3,
|
|
owner="alice",
|
|
)
|
|
|
|
assert entry is None
|
|
assert not skills_manager.added
|
|
|