feat: classifier wrapper with retry, timeout, schema-default fallback
This commit is contained in:
@@ -0,0 +1,8 @@
|
||||
-- Failure log for the classifier wrapper.
-- NOTE(review): column meanings are inferred from their names only; confirm
-- against the code that inserts rows before relying on them.
CREATE TABLE classifier_failures (
    id            INTEGER PRIMARY KEY,
    kind          TEXT    NOT NULL,   -- presumably the failure category
    model         TEXT    NOT NULL,   -- presumably the model identifier used
    raw_text      TEXT,               -- nullable; presumably the raw model output
    attempt_count INTEGER NOT NULL,
    -- Filled in at insert time when the writer does not supply a value.
    created_at    TEXT    NOT NULL DEFAULT (datetime('now'))
);
|
||||
@@ -0,0 +1,41 @@
|
||||
from __future__ import annotations
|
||||
import json
|
||||
import asyncio
|
||||
from typing import TypeVar
|
||||
from pydantic import BaseModel, ValidationError
|
||||
from .client import LLMClient, Message
|
||||
|
||||
# Generic parameter for classify(): the pydantic model class passed as
# `schema` determines the type of the returned instance.
T = TypeVar("T", bound=BaseModel)
|
||||
|
||||
# Lowercase phrases that mark a reply as a refusal instead of JSON. classify()
# searches for them in the lowercased first 80 characters of the model output.
REFUSAL_PATTERNS = (
    "i can't",
    "i cannot",
    "i'm sorry, but",
    "as an ai",
)
|
||||
|
||||
|
||||
async def classify(
    client: LLMClient,
    *,
    model: str,
    system: str,
    user: str,
    schema: type[T],
    default: T | None = None,
    timeout_s: float = 10.0,
    max_attempts: int = 2,
) -> T:
    """Ask the model for a JSON reply and validate it against ``schema``.

    Each attempt awaits ``client.generate`` under a ``timeout_s`` deadline.
    A reply that looks like a refusal, fails validation, or times out
    triggers another attempt with a stricter system prompt, up to
    ``max_attempts`` attempts in total.

    Args:
        client: LLM client; ``generate`` is awaited with the message list,
            ``model`` and a ``json_object`` response format. Its result is
            treated as a string.
        model: Model identifier forwarded to ``client.generate``.
        system: System prompt; a JSON-only instruction is appended to it.
        user: User message content.
        schema: Pydantic model class used to validate the reply.
        default: Value returned when every attempt fails. ``None`` means
            "no fallback".
        timeout_s: Per-attempt timeout in seconds.
        max_attempts: Total number of attempts (first call plus retries).

    Returns:
        The validated ``schema`` instance, or ``default`` if all attempts
        failed and a default was supplied.

    Raises:
        ValueError: If ``max_attempts`` is less than 1.
        RuntimeError: If all attempts failed and ``default`` is ``None``.
            The last underlying error is attached as ``__cause__``.
    """
    if max_attempts < 1:
        raise ValueError("max_attempts must be at least 1")

    msgs = [
        Message(role="system", content=system + "\n\nRespond with JSON only matching the schema."),
        Message(role="user", content=user),
    ]
    last_error: Exception | None = None

    for attempt in range(max_attempts):
        try:
            text = await asyncio.wait_for(
                client.generate(msgs, model=model, response_format={"type": "json_object"}),
                timeout=timeout_s,
            )
            # Only the start of the reply is inspected, and a reply that
            # begins with "{" is never treated as a refusal.
            head = text.lower()[:80]
            if not text.strip().startswith("{") and any(p in head for p in REFUSAL_PATTERNS):
                raise ValueError("refusal-shaped response")
            return schema.model_validate_json(text)
        except (ValidationError, ValueError, json.JSONDecodeError, asyncio.TimeoutError) as exc:
            # Keep the failure so the terminal error can report its cause.
            last_error = exc
            # Tighten the prompt only when another attempt will follow.
            if attempt + 1 < max_attempts:
                msgs[0] = Message(role="system", content=system + "\n\nRespond with valid JSON ONLY. No prose.")

    if default is None:
        raise RuntimeError(
            f"classify failed for schema {schema.__name__} with no default"
        ) from last_error
    return default
|
||||
@@ -0,0 +1,24 @@
|
||||
import pytest
|
||||
from pydantic import BaseModel
|
||||
from chat.llm.mock import MockLLMClient
|
||||
from chat.llm.classify import classify
|
||||
|
||||
|
||||
class Verdict(BaseModel):
    """Minimal schema used by the classify() tests below."""

    # Integer score field asserted on by the valid-JSON test.
    score: int
    # Free-text field asserted on by the fallback test.
    reason: str
|
||||
|
||||
|
||||
@pytest.mark.asyncio
async def test_classify_parses_valid_json():
    """A single well-formed JSON reply is validated into a Verdict."""
    canned_reply = '{"score": 2, "reason": "notable"}'
    client = MockLLMClient(canned=[canned_reply])

    verdict = await classify(
        client,
        model="m",
        system="x",
        user="y",
        schema=Verdict,
    )

    assert verdict.score == 2
|
||||
|
||||
|
||||
@pytest.mark.asyncio
async def test_classify_falls_back_on_unparseable_after_retry():
    """Two non-JSON replies in a row make classify() return the default."""
    fallback = Verdict(score=1, reason="fallback")
    client = MockLLMClient(canned=["nope", "still nope"])

    verdict = await classify(
        client,
        model="m",
        system="x",
        user="y",
        schema=Verdict,
        default=fallback,
    )

    assert verdict.reason == "fallback"
|
||||
Reference in New Issue
Block a user