merge: T101 phase 4 cross-feature integration tests
This commit is contained in:
@@ -1,20 +1,38 @@
|
||||
"""Phase 4 cross-feature integration tests (T97 follow-up).
|
||||
"""Phase 4 cross-feature integration tests (T97 follow-up + T101).
|
||||
|
||||
Wave 8 / T101 will populate this file with the full Phase 4 retrieval +
|
||||
embedding integration suite. For now this houses a single test pinning
|
||||
the T97.5 wiring: the production turn route plumbs ``app=request.app``
|
||||
all the way through ``record_turn_memory_for_present`` so the embedding
|
||||
worker actually receives jobs in production. Without this fix-up the
|
||||
plumbing added in T97 was dormant — every per-witness write took the
|
||||
no-app branch and silently dropped the embed enqueue.
|
||||
Cross-feature flows for the Phase 4 retrieval + branching + drawer
|
||||
features. Each test drives multiple Phase 4 surfaces end-to-end and
|
||||
asserts both event_log and projected-state outcomes.
|
||||
|
||||
The test monkeypatches ``app.state.embedding_worker.enqueue`` to record
|
||||
jobs (rather than draining the worker mid-test) so the assertion is
|
||||
deterministic and free of asyncio-timing flakiness inside FastAPI's
|
||||
TestClient. The bug we're guarding against is "did the call site pass
|
||||
``app`` at all" — the worker's drain path is exercised in
|
||||
:mod:`tests.test_embedding_worker`, so duplicating that here would add
|
||||
no coverage.
|
||||
Test inventory:
|
||||
|
||||
* ``test_post_turn_embeddings_indexed_via_worker_hook`` (T97.5) —
|
||||
pins the production turn route's ``app=request.app`` plumbing so
|
||||
the embedding worker actually receives jobs.
|
||||
|
||||
T101 additions (the "Phase 4 cross-feature integration" suite):
|
||||
|
||||
1. ``test_vector_retrieval_feedback_loop`` — write a memory, drain
|
||||
the embedding worker, assert the vector path retrieves it.
|
||||
2. ``test_branch_diverge_main_intact`` — create a branch from a
|
||||
mid-log turn, switch, append more events, switch back and assert
|
||||
the original log past the branch point is still present (Phase 4
|
||||
branching is metadata-only — no read-side filter yet).
|
||||
3. ``test_surgical_delete_truncates_log_and_writes_snapshot`` —
|
||||
compute impact, confirm via the drawer route, assert the log was
|
||||
truncated and a pre-rewind snapshot landed on disk.
|
||||
4. ``test_hide_then_unhide_round_trip_through_read_recent_dialogue``
|
||||
— flip ``hidden`` via the drawer route both directions and assert
|
||||
``read_recent_dialogue`` honours the flag in real time.
|
||||
5. ``test_cross_chat_search_surfaces_memories_in_three_chats`` —
|
||||
write memories in 3 chats, hit ``/search?q=...`` and assert all
|
||||
three appear.
|
||||
|
||||
The T97.5 test monkeypatches ``app.state.embedding_worker.enqueue`` to
|
||||
record jobs (rather than draining the worker) because the bug it pins
|
||||
is "did the call site pass ``app`` at all". T101 test 1 takes the
|
||||
opposite tack: it drives the worker for real to verify the entire
|
||||
write -> index -> retrieve loop.
|
||||
"""
|
||||
|
||||
from __future__ import annotations
|
||||
@@ -27,7 +45,7 @@ from fastapi.testclient import TestClient
|
||||
|
||||
from chat.app import app
|
||||
from chat.db.connection import open_db
|
||||
from chat.eventlog.log import append_event
|
||||
from chat.eventlog.log import append_and_apply, append_event
|
||||
from chat.eventlog.projector import project
|
||||
from chat.llm.mock import MockLLMClient
|
||||
|
||||
@@ -178,3 +196,696 @@ def test_post_turn_embeddings_indexed_via_worker_hook(
|
||||
).fetchall()
|
||||
]
|
||||
assert job.memory_id in memory_ids
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# T101 — Phase 4 cross-feature integration suite.
|
||||
# ---------------------------------------------------------------------------
|
||||
#
|
||||
# Helpers + the five required scenarios. Each test drives multiple Phase 4
|
||||
# features so a regression in any one of them fails an integration check.
|
||||
|
||||
|
||||
def _seed_minimal_chat(db_path: Path, chat_id: str = "chat_bot_a") -> None:
|
||||
"""Seed bot_a, you, a chat, edges, and activities — same shape as
|
||||
``tests/test_phase3_integration.py::_seed_single_bot_chat`` but
|
||||
parameterised on chat_id so the cross-chat search test can stamp
|
||||
several chats in the same database without renaming bots.
|
||||
|
||||
Uses ``append_and_apply`` rather than ``append_event`` + a final
|
||||
``project`` so successive calls (e.g. one per chat in the
|
||||
cross-chat-search test) don't try to re-project the cumulative
|
||||
log and trip the ``chats.id`` UNIQUE constraint on the prior
|
||||
chat's row.
|
||||
"""
|
||||
with open_db(db_path) as conn:
|
||||
existing_bot = conn.execute(
|
||||
"SELECT 1 FROM bots WHERE id = 'bot_a'"
|
||||
).fetchone()
|
||||
if existing_bot is None:
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="bot_authored",
|
||||
payload={
|
||||
"id": "bot_a",
|
||||
"name": "BotA",
|
||||
"persona": "thoughtful",
|
||||
"voice_samples": [],
|
||||
"traits": [],
|
||||
"backstory": "",
|
||||
"initial_relationship_to_you": "",
|
||||
"kickoff_prose": "...",
|
||||
},
|
||||
)
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="you_authored",
|
||||
payload={
|
||||
"name": "Me",
|
||||
"pronouns": "they/them",
|
||||
"persona": "",
|
||||
},
|
||||
)
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="chat_created",
|
||||
payload={
|
||||
"id": chat_id,
|
||||
"host_bot_id": "bot_a",
|
||||
"initial_time": "2026-04-26T20:00:00+00:00",
|
||||
"narrative_anchor": "Day 1",
|
||||
"weather": "",
|
||||
},
|
||||
)
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="edge_update",
|
||||
payload={
|
||||
"source_id": "bot_a",
|
||||
"target_id": "you",
|
||||
"chat_id": chat_id,
|
||||
"knowledge_facts": [],
|
||||
},
|
||||
)
|
||||
# Activities are unique per (entity_id) — only seed them on the
|
||||
# first call (when the bot row is also fresh).
|
||||
if existing_bot is None:
|
||||
for entity_id, verb in [
|
||||
("you", "talking"),
|
||||
("bot_a", "listening"),
|
||||
]:
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="activity_change",
|
||||
payload={
|
||||
"entity_id": entity_id,
|
||||
"posture": "sitting",
|
||||
"action": {
|
||||
"verb": verb,
|
||||
"interruptible": True,
|
||||
"required_attention": "low",
|
||||
"expected_duration": "ongoing",
|
||||
},
|
||||
"attention": "",
|
||||
"holding": [],
|
||||
"status": {},
|
||||
},
|
||||
)
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# 1. Vector retrieval feedback loop.
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
|
||||
async def test_vector_retrieval_feedback_loop(tmp_path):
|
||||
"""End-to-end: write a memory through
|
||||
:func:`record_turn_memory_for_present` so an :class:`EmbeddingJob`
|
||||
lands on a worker, drain the worker, then call
|
||||
:func:`vector_search` with the SAME pseudo-embedding function and
|
||||
assert the just-written memory is the top hit.
|
||||
|
||||
Why this test does NOT use the TestClient fixture: the live
|
||||
``app.state.embedding_worker`` is created inside the FastAPI
|
||||
lifespan's event loop. ``await``-ing on it from pytest-asyncio's
|
||||
loop trips ``"got Future attached to a different loop"``. We
|
||||
instead spin up a fresh :class:`EmbeddingWorker` in the test
|
||||
loop, exactly mirroring ``tests/test_embedding_worker.py``'s
|
||||
pattern. The T97.5 test above pins the wiring between the live
|
||||
HTTP route and the live app worker; this test pins the
|
||||
write -> index -> retrieve loop with no transport in scope.
|
||||
|
||||
Cross-feature gaps this test catches:
|
||||
* Memory write enqueues to the worker but the worker never
|
||||
drains (e.g. ``_run`` deadlock or sentinel mishandled).
|
||||
* Worker uses a different embedding function than
|
||||
``vector_search`` at query time, producing different vectors
|
||||
and breaking cosine retrieval.
|
||||
* ``embeddings`` projector handler is not registered (e.g.
|
||||
import ordering bug) so the event fires but the table stays
|
||||
empty.
|
||||
"""
|
||||
from types import SimpleNamespace
|
||||
|
||||
from chat.db.migrate import apply_migrations
|
||||
from chat.services.embedding_worker import EmbeddingWorker
|
||||
from chat.services.embeddings import generate_embedding
|
||||
from chat.services.memory_write import record_turn_memory_for_present
|
||||
from chat.services.vector_search import vector_search
|
||||
|
||||
# Trigger projector handler registration. ``record_turn_memory_for_present``
|
||||
# imports memory_write which imports the worker module, but the
|
||||
# projector handlers live in ``chat.state.*`` modules and are
|
||||
# registered as a side effect of import.
|
||||
import chat.state.embeddings # noqa: F401
|
||||
import chat.state.entities # noqa: F401
|
||||
import chat.state.memory # noqa: F401
|
||||
import chat.state.world # noqa: F401
|
||||
|
||||
db = tmp_path / "test.db"
|
||||
apply_migrations(db)
|
||||
_seed_minimal_chat(db)
|
||||
|
||||
# Spin up our own worker in the test event loop. ``client=None``
|
||||
# is fine for the pseudo-embedding path — the local hash function
|
||||
# does not require an LLM client.
|
||||
worker = EmbeddingWorker(
|
||||
conn_factory=lambda: open_db(db),
|
||||
client=None,
|
||||
)
|
||||
await worker.start()
|
||||
|
||||
# Stub ``app`` — only ``app.state.embedding_worker`` is read by
|
||||
# ``_write_one_memory``. SimpleNamespace gives us a stand-in that
|
||||
# exposes ``state.embedding_worker`` without the full FastAPI app.
|
||||
fake_app = SimpleNamespace(state=SimpleNamespace(embedding_worker=worker))
|
||||
|
||||
distinctive_text = "Maya watched the gondola lights drift across the lagoon."
|
||||
with open_db(db) as conn:
|
||||
record_turn_memory_for_present(
|
||||
conn,
|
||||
chat_id="chat_bot_a",
|
||||
host_bot_id="bot_a",
|
||||
guest_bot_id=None,
|
||||
narrative_text=distinctive_text,
|
||||
app=fake_app,
|
||||
)
|
||||
|
||||
# Drain the worker via the sentinel. After this returns the
|
||||
# ``embedding_indexed`` event has been projected.
|
||||
await worker.stop()
|
||||
|
||||
# Generate a query embedding using the same function the worker
|
||||
# used. The pseudo-embedding is deterministic so a query equal to
|
||||
# the indexed text produces the identical vector and a cosine
|
||||
# similarity of 1.0.
|
||||
query_result = await generate_embedding(client=None, text=distinctive_text)
|
||||
|
||||
with open_db(db) as conn:
|
||||
emb_count = conn.execute(
|
||||
"SELECT COUNT(*) FROM embeddings"
|
||||
).fetchone()[0]
|
||||
assert emb_count == 1, (
|
||||
"embedding worker did not project an embedding_indexed event"
|
||||
)
|
||||
|
||||
hits = vector_search(
|
||||
conn,
|
||||
owner_id="bot_a",
|
||||
witness_role="host", # bot_a is host, witness_host=1 by default
|
||||
query_vector=query_result.vector,
|
||||
k=4,
|
||||
)
|
||||
assert len(hits) == 1
|
||||
top = hits[0]
|
||||
assert top["pov_summary"] == distinctive_text
|
||||
# Self-match: cosine of identical vectors is 1.0.
|
||||
assert top["score"] == pytest.approx(1.0, abs=1e-9)
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# 2. Branch + diverge: main's post-branch tail stays intact (Phase 4
|
||||
# branches are metadata-only).
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
|
||||
def test_branch_diverge_main_intact(app_state_setup, tmp_path):
|
||||
"""Append turns 1-12 on main, branch from turn 10's event_id, switch
|
||||
to the new branch, append 3 more "play" turns, switch back to main,
|
||||
assert the original turn 11+ events are untouched.
|
||||
|
||||
Phase 4's branches table is metadata-only — the read-side filter
|
||||
isn't wired yet, so all events live in one log regardless of which
|
||||
branch is "active". This test pins that contract: switching does
|
||||
not mutate or hide existing events on either branch.
|
||||
|
||||
Canned LLM queue: none. ``user_turn`` / ``assistant_turn`` are
|
||||
transcript-only kinds with no projector handler that needs an
|
||||
LLM call, and ``branch_created`` / ``branch_switched`` are pure
|
||||
state events. We use ``append_and_apply`` directly rather than
|
||||
driving the HTTP turn route, which would require a 6-slot canned
|
||||
queue per turn (parse + narrative + 2 state-updates + scene-close
|
||||
+ memory) for 15 turns total = 90 slots of plumbing irrelevant to
|
||||
the branch contract.
|
||||
"""
|
||||
from chat.services.branching import branch_from_event, switch_active_branch
|
||||
from chat.state.branches import active_branch
|
||||
|
||||
db = tmp_path / "test.db"
|
||||
_seed_minimal_chat(db)
|
||||
|
||||
# Append 12 user_turn / assistant_turn pairs on main. We collect
|
||||
# the assistant_turn id at index 10 (1-based: "turn 10") so the
|
||||
# branch fork point is unambiguous.
|
||||
main_turn_ids: list[int] = []
|
||||
with open_db(db) as conn:
|
||||
for i in range(1, 13):
|
||||
user_id = append_and_apply(
|
||||
conn,
|
||||
kind="user_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"prose": f"main turn {i}",
|
||||
"segments": [],
|
||||
},
|
||||
)
|
||||
asst_id = append_and_apply(
|
||||
conn,
|
||||
kind="assistant_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"speaker_id": "bot_a",
|
||||
"text": f"main reply {i}",
|
||||
"truncated": False,
|
||||
"user_turn_id": user_id,
|
||||
},
|
||||
)
|
||||
main_turn_ids.append(asst_id)
|
||||
turn_10_id = main_turn_ids[9]
|
||||
|
||||
# Snapshot the post-turn-10 main tail (turns 11, 12 + their
|
||||
# user_turn predecessors) so we can byte-compare after the
|
||||
# round-trip.
|
||||
main_tail_before = conn.execute(
|
||||
"SELECT id, kind, payload_json, hidden, superseded_by "
|
||||
"FROM event_log WHERE id > ? ORDER BY id",
|
||||
(turn_10_id,),
|
||||
).fetchall()
|
||||
assert len(main_tail_before) == 4 # 2 user + 2 assistant past turn 10
|
||||
|
||||
# Branch from turn 10. Phase 4's helper validates the origin
|
||||
# event id exists and emits ``branch_created``.
|
||||
branch_from_event(
|
||||
conn,
|
||||
name="experiment",
|
||||
origin_event_id=turn_10_id,
|
||||
chat_id="chat_bot_a",
|
||||
)
|
||||
switch_active_branch(conn, name="experiment")
|
||||
active = active_branch(conn)
|
||||
assert active is not None and active["name"] == "experiment"
|
||||
|
||||
# Play 3 turns on the experiment branch.
|
||||
for i in range(1, 4):
|
||||
user_id = append_and_apply(
|
||||
conn,
|
||||
kind="user_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"prose": f"experiment turn {i}",
|
||||
"segments": [],
|
||||
},
|
||||
)
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="assistant_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"speaker_id": "bot_a",
|
||||
"text": f"experiment reply {i}",
|
||||
"truncated": False,
|
||||
"user_turn_id": user_id,
|
||||
},
|
||||
)
|
||||
|
||||
# Switch back to main.
|
||||
switch_active_branch(conn, name="main")
|
||||
active2 = active_branch(conn)
|
||||
assert active2 is not None and active2["name"] == "main"
|
||||
|
||||
# Main's original tail past turn 10 is byte-identical: the
|
||||
# branching events (branch_created, branch_switched x2) and the
|
||||
# 3 experiment turns sit AFTER the original tail in event_log
|
||||
# order, never overwriting it.
|
||||
main_tail_after = conn.execute(
|
||||
"SELECT id, kind, payload_json, hidden, superseded_by "
|
||||
"FROM event_log "
|
||||
"WHERE id > ? AND id <= ? ORDER BY id",
|
||||
(turn_10_id, main_turn_ids[-1]),
|
||||
).fetchall()
|
||||
assert main_tail_after == main_tail_before
|
||||
|
||||
# The 6 experiment events (3 user + 3 assistant) all live in
|
||||
# the same log past the original main tail. Verify their
|
||||
# prose payloads to disambiguate from main's content.
|
||||
diverged = conn.execute(
|
||||
"SELECT kind, json_extract(payload_json, '$.prose'), "
|
||||
" json_extract(payload_json, '$.text') "
|
||||
"FROM event_log WHERE id > ? "
|
||||
" AND kind IN ('user_turn', 'assistant_turn') ORDER BY id",
|
||||
(main_turn_ids[-1],),
|
||||
).fetchall()
|
||||
assert len(diverged) == 6
|
||||
prose_or_text = [(row[1] or row[2]) for row in diverged]
|
||||
# Sequence: user1, asst1, user2, asst2, user3, asst3.
|
||||
assert "experiment turn 1" in prose_or_text
|
||||
assert "experiment reply 1" in prose_or_text
|
||||
assert "experiment turn 3" in prose_or_text
|
||||
assert "experiment reply 3" in prose_or_text
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# 3. Surgical delete: impact preview -> confirm -> log truncated +
|
||||
# pre-rewind snapshot saved.
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
|
||||
def test_surgical_delete_truncates_log_and_writes_snapshot(
|
||||
app_state_setup, tmp_path
|
||||
):
|
||||
"""Compute the delete-impact for a turn (read-only preview), then
|
||||
confirm via the POST drawer route. Assert:
|
||||
|
||||
* The preview returns 200 + cascade markup.
|
||||
* The event_log is physically truncated past ``target_id - 1``.
|
||||
* A snapshot file lands under ``<data_dir>/snapshots/rewind/``.
|
||||
* The pre-rewind snapshot's ``last_event_id`` matches the high
|
||||
water mark BEFORE the truncate (so recovery can replay back to
|
||||
pre-delete state).
|
||||
|
||||
Snapshot location: T97.5's ``data_dir`` derives from the db's
|
||||
parent directory when ``CHAT_DATA_DIR`` is unset. The fixture
|
||||
sets ``CHAT_DB_PATH = tmp_path / "test.db"`` so the snapshot
|
||||
parent is ``tmp_path / "snapshots" / "rewind"``.
|
||||
|
||||
No canned LLM queue — the preview is pure SQL and the rewind path
|
||||
is also pure SQL (delete + reproject). The drawer routes don't
|
||||
invoke the LLM.
|
||||
"""
|
||||
import json as _json
|
||||
|
||||
db = tmp_path / "test.db"
|
||||
_seed_minimal_chat(db)
|
||||
|
||||
# Append a small fixed turn sequence we can predict the cascade for.
|
||||
with open_db(db) as conn:
|
||||
first_user = append_and_apply(
|
||||
conn,
|
||||
kind="user_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"prose": "first message",
|
||||
"segments": [],
|
||||
},
|
||||
)
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="assistant_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"speaker_id": "bot_a",
|
||||
"text": "first reply",
|
||||
"truncated": False,
|
||||
"user_turn_id": first_user,
|
||||
},
|
||||
)
|
||||
target_user = append_and_apply(
|
||||
conn,
|
||||
kind="user_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"prose": "this turn will be deleted",
|
||||
"segments": [],
|
||||
},
|
||||
)
|
||||
target_asst = append_and_apply(
|
||||
conn,
|
||||
kind="assistant_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"speaker_id": "bot_a",
|
||||
"text": "and so will this reply",
|
||||
"truncated": False,
|
||||
"user_turn_id": target_user,
|
||||
},
|
||||
)
|
||||
# One trailing event past the target so we can verify the
|
||||
# cascade catches >1 event.
|
||||
trailing = append_and_apply(
|
||||
conn,
|
||||
kind="user_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"prose": "trailing context",
|
||||
"segments": [],
|
||||
},
|
||||
)
|
||||
max_id_before = conn.execute(
|
||||
"SELECT MAX(id) FROM event_log"
|
||||
).fetchone()[0]
|
||||
|
||||
# ---- Preview: GET delete-preview returns 200 + the cascade list. ----
|
||||
preview = app_state_setup.get(
|
||||
f"/chats/chat_bot_a/drawer/turn/delete-preview/{target_user}"
|
||||
)
|
||||
assert preview.status_code == 200
|
||||
body = preview.text
|
||||
assert "delete-impact-modal" in body
|
||||
assert f"Delete event {target_user}?" in body
|
||||
assert "user_turn" in body
|
||||
assert "assistant_turn" in body
|
||||
# Confirm form points at the delete route.
|
||||
assert f"/drawer/turn/delete/{target_user}" in body
|
||||
|
||||
# ---- Confirm: POST delete drops user, assistant, AND trailing. ----
|
||||
confirm = app_state_setup.post(
|
||||
f"/chats/chat_bot_a/drawer/turn/delete/{target_user}"
|
||||
)
|
||||
assert confirm.status_code == 200
|
||||
|
||||
# ---- Event log truncated past target_user - 1. ----
|
||||
with open_db(db) as conn:
|
||||
max_id_after = conn.execute(
|
||||
"SELECT MAX(id) FROM event_log"
|
||||
).fetchone()[0]
|
||||
# delete_turn passes ``after_event_id = target_user - 1`` so
|
||||
# everything from target_user forward is gone.
|
||||
assert max_id_after == target_user - 1
|
||||
for ev_id in (target_user, target_asst, trailing):
|
||||
row = conn.execute(
|
||||
"SELECT 1 FROM event_log WHERE id = ?", (ev_id,)
|
||||
).fetchone()
|
||||
assert row is None, f"event {ev_id} should have been deleted"
|
||||
|
||||
# ---- Pre-rewind snapshot landed on disk. ----
|
||||
snapshot_dir = tmp_path / "snapshots" / "rewind"
|
||||
assert snapshot_dir.exists(), (
|
||||
f"snapshot dir not created: {snapshot_dir}"
|
||||
)
|
||||
snapshots = sorted(snapshot_dir.glob("*.json"))
|
||||
assert len(snapshots) >= 1, (
|
||||
f"no rewind snapshot written under {snapshot_dir}"
|
||||
)
|
||||
# Most-recent snapshot's last_event_id == pre-truncate high water
|
||||
# mark, so a "restore" path could fully reverse the delete.
|
||||
latest_snapshot = snapshots[-1]
|
||||
snap_data = _json.loads(latest_snapshot.read_text())
|
||||
assert snap_data["last_event_id"] == max_id_before
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# 4. Hide + retrieval: drawer hide drops a turn from read_recent_dialogue,
|
||||
# unhide restores it.
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
|
||||
def test_hide_then_unhide_round_trip_through_read_recent_dialogue(
|
||||
app_state_setup, tmp_path
|
||||
):
|
||||
"""Drive a hide -> read -> unhide -> read cycle through the drawer
|
||||
HTTP route and assert ``read_recent_dialogue`` flips visibility
|
||||
each step. T98.3 wires the route; T55 / turn_common owns the
|
||||
``hidden = 0`` filter.
|
||||
|
||||
Cross-feature: the drawer HTTP handler emits a ``manual_edit``
|
||||
event with branch ``turn_hidden``, the manual_edit projector
|
||||
flips ``event_log.hidden``, and the prompt-window reader filters
|
||||
on that column. Three layers — any one breaking would fail this
|
||||
test.
|
||||
|
||||
No canned LLM queue — hide/unhide are pure SQL routes.
|
||||
"""
|
||||
from chat.services.turn_common import read_recent_dialogue
|
||||
|
||||
db = tmp_path / "test.db"
|
||||
_seed_minimal_chat(db)
|
||||
|
||||
with open_db(db) as conn:
|
||||
user_a = append_and_apply(
|
||||
conn,
|
||||
kind="user_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"prose": "first user line",
|
||||
"segments": [],
|
||||
},
|
||||
)
|
||||
asst_a = append_and_apply(
|
||||
conn,
|
||||
kind="assistant_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"speaker_id": "bot_a",
|
||||
"text": "first reply",
|
||||
"truncated": False,
|
||||
"user_turn_id": user_a,
|
||||
},
|
||||
)
|
||||
user_b = append_and_apply(
|
||||
conn,
|
||||
kind="user_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"prose": "second user line",
|
||||
"segments": [],
|
||||
},
|
||||
)
|
||||
asst_b = append_and_apply(
|
||||
conn,
|
||||
kind="assistant_turn",
|
||||
payload={
|
||||
"chat_id": "chat_bot_a",
|
||||
"speaker_id": "bot_a",
|
||||
"text": "second reply",
|
||||
"truncated": False,
|
||||
"user_turn_id": user_b,
|
||||
},
|
||||
)
|
||||
|
||||
# Baseline: all 4 turns visible.
|
||||
baseline = read_recent_dialogue(conn, "chat_bot_a", limit=10)
|
||||
baseline_ids = {t["event_id"] for t in baseline}
|
||||
assert {user_a, asst_a, user_b, asst_b} <= baseline_ids
|
||||
|
||||
# ---- Hide user_b via the drawer route. ----
|
||||
hide_resp = app_state_setup.post(
|
||||
f"/chats/chat_bot_a/drawer/turn/hide/{user_b}",
|
||||
data={"hidden": "1"},
|
||||
)
|
||||
assert hide_resp.status_code == 200
|
||||
|
||||
with open_db(db) as conn:
|
||||
# event_log.hidden flipped.
|
||||
row = conn.execute(
|
||||
"SELECT hidden FROM event_log WHERE id = ?", (user_b,)
|
||||
).fetchone()
|
||||
assert int(row[0]) == 1
|
||||
|
||||
# read_recent_dialogue drops user_b but keeps the others.
|
||||
after_hide = read_recent_dialogue(conn, "chat_bot_a", limit=10)
|
||||
after_hide_ids = {t["event_id"] for t in after_hide}
|
||||
assert user_b not in after_hide_ids
|
||||
# The other 3 turns still surface.
|
||||
assert {user_a, asst_a, asst_b} <= after_hide_ids
|
||||
|
||||
# ---- Unhide via the SAME route with hidden=0. ----
|
||||
unhide_resp = app_state_setup.post(
|
||||
f"/chats/chat_bot_a/drawer/turn/hide/{user_b}",
|
||||
data={"hidden": "0"},
|
||||
)
|
||||
assert unhide_resp.status_code == 200
|
||||
|
||||
with open_db(db) as conn:
|
||||
row = conn.execute(
|
||||
"SELECT hidden FROM event_log WHERE id = ?", (user_b,)
|
||||
).fetchone()
|
||||
assert int(row[0]) == 0
|
||||
|
||||
# read_recent_dialogue restores user_b.
|
||||
after_unhide = read_recent_dialogue(conn, "chat_bot_a", limit=10)
|
||||
after_unhide_ids = {t["event_id"] for t in after_unhide}
|
||||
assert {user_a, asst_a, user_b, asst_b} <= after_unhide_ids
|
||||
|
||||
# Two manual_edit events landed (one per toggle), each with the
|
||||
# turn_hidden branch tag.
|
||||
edits = conn.execute(
|
||||
"SELECT payload_json FROM event_log "
|
||||
"WHERE kind = 'manual_edit' "
|
||||
" AND json_extract(payload_json, '$.target_kind') = 'turn_hidden' "
|
||||
"ORDER BY id"
|
||||
).fetchall()
|
||||
assert len(edits) == 2
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# 5. Cross-chat search: memories across 3 chats all surface from /search.
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
|
||||
def test_cross_chat_search_surfaces_memories_in_three_chats(
|
||||
app_state_setup, tmp_path
|
||||
):
|
||||
"""Seed 3 chats each owned by bot_a (so the bot row exists for the
|
||||
search route's display-name hydration), write a distinctive
|
||||
memory in each, then GET ``/search?q=<distinctive>`` and assert
|
||||
every chat appears as a result row.
|
||||
|
||||
Cross-feature: T93's :func:`search_all_memories` (no per-owner
|
||||
filter) + T100's HTML route (display-name hydration via
|
||||
``get_bot``/``get_chat``). The route's empty-query short-circuit
|
||||
is incidentally exercised by the request setup but isn't the
|
||||
focus.
|
||||
|
||||
No canned LLM queue — memory_written events are projected directly
|
||||
via ``append_and_apply`` and the search route is pure SQL +
|
||||
template rendering.
|
||||
"""
|
||||
db = tmp_path / "test.db"
|
||||
# Three chats, all hosted by bot_a so bot_a is the owner of all
|
||||
# three memories. _seed_minimal_chat skips the bot/you bootstrap
|
||||
# after the first call so the cumulative seed is consistent.
|
||||
chat_ids = ["chat_bot_a", "chat_bot_a_2", "chat_bot_a_3"]
|
||||
for chat_id in chat_ids:
|
||||
_seed_minimal_chat(db, chat_id=chat_id)
|
||||
|
||||
# Distinctive token — "wisteria" appears nowhere else in the seed.
|
||||
distinctive = "wisteria"
|
||||
with open_db(db) as conn:
|
||||
for idx, chat_id in enumerate(chat_ids):
|
||||
append_and_apply(
|
||||
conn,
|
||||
kind="memory_written",
|
||||
payload={
|
||||
"owner_id": "bot_a",
|
||||
"chat_id": chat_id,
|
||||
"pov_summary": (
|
||||
f"the {distinctive} bloomed by the gate (chat {idx})"
|
||||
),
|
||||
"witness_you": 1,
|
||||
"witness_host": 1,
|
||||
"witness_guest": 0,
|
||||
"source": "direct",
|
||||
"reliability": 1.0,
|
||||
"significance": 1,
|
||||
"pinned": 0,
|
||||
"auto_pinned": 0,
|
||||
},
|
||||
)
|
||||
|
||||
# ---- GET /search?q=wisteria -> all 3 chats appear as result rows. ----
|
||||
response = app_state_setup.get(f"/search?q={distinctive}")
|
||||
assert response.status_code == 200
|
||||
body = response.text
|
||||
|
||||
# Each chat_id appears in a result link href, e.g.
|
||||
# ``href="/chats/chat_bot_a"``. The template renders one
|
||||
# ``<a class="search-result-link" href="/chats/{chat_id}">`` per
|
||||
# row, so a substring match per chat is sufficient.
|
||||
for chat_id in chat_ids:
|
||||
assert f'href="/chats/{chat_id}"' in body, (
|
||||
f"chat {chat_id} missing from /search results: {body!r}"
|
||||
)
|
||||
# The owner display name (BotA) renders for each row — verify >= 3
|
||||
# occurrences so we know all 3 result rows hydrated, not just 1.
|
||||
assert body.count("BotA") >= 3
|
||||
|
||||
# ---- Sanity: distractor query yields no results. ----
|
||||
distractor_response = app_state_setup.get(
|
||||
"/search?q=nonexistentterm12345"
|
||||
)
|
||||
assert distractor_response.status_code == 200
|
||||
distractor_body = distractor_response.text
|
||||
# The "no matches" empty-state copy fires.
|
||||
assert "No matches" in distractor_body
|
||||
for chat_id in chat_ids:
|
||||
assert f'href="/chats/{chat_id}"' not in distractor_body
|
||||
|
||||
Reference in New Issue
Block a user