tests/test_reinforcement.py

"""Tests for Phase 9 Commit B reinforcement loop."""

from fastapi.testclient import TestClient

from atocore.interactions.service import record_interaction
from atocore.main import app
from atocore.memory.reinforcement import (
    DEFAULT_CONFIDENCE_DELTA,
    reinforce_from_interaction,
)
from atocore.memory.service import (
    create_memory,
    get_memories,
    reinforce_memory,
)
from atocore.models.database import init_db


# --- service-level tests: reinforce_memory primitive ----------------------


def test_reinforce_memory_bumps_active_memory(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="prefers Python over Ruby for scripting",
        confidence=0.6,
    )

    applied, old_conf, new_conf = reinforce_memory(mem.id, confidence_delta=0.05)

    assert applied is True
    assert old_conf == 0.6
    assert abs(new_conf - 0.65) < 1e-9

    reloaded = get_memories(memory_type="preference", limit=10)
    match = next((m for m in reloaded if m.id == mem.id), None)
    assert match is not None
    assert abs(match.confidence - 0.65) < 1e-9
    assert match.reference_count == 1
    assert match.last_referenced_at  # non-empty


def test_reinforce_memory_caps_at_one(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="identity",
        content="is a mechanical engineer who runs AtoCore",
        confidence=0.98,
    )
    applied, old_conf, new_conf = reinforce_memory(mem.id, confidence_delta=0.05)
    assert applied is True
    assert old_conf == 0.98
    assert new_conf == 1.0


def test_reinforce_memory_rejects_candidate_and_missing(tmp_data_dir):
    init_db()
    candidate = create_memory(
        memory_type="knowledge",
        content="the lateral support uses GF-PTFE pads",
        confidence=0.5,
        status="candidate",
    )
    applied, _, _ = reinforce_memory(candidate.id)
    assert applied is False

    missing, _, _ = reinforce_memory("no-such-id")
    assert missing is False


def test_reinforce_memory_accumulates_reference_count(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="likes concise code reviews that focus on the why",
        confidence=0.5,
    )
    for _ in range(5):
        reinforce_memory(mem.id, confidence_delta=0.01)
    reloaded = [m for m in get_memories(memory_type="preference", limit=10) if m.id == mem.id][0]
    assert reloaded.reference_count == 5
    assert abs(reloaded.confidence - 0.55) < 1e-9


def test_reinforce_memory_rejects_negative_delta(tmp_data_dir):
    init_db()
    mem = create_memory(memory_type="preference", content="always uses structured logging")
    import pytest

    with pytest.raises(ValueError):
        reinforce_memory(mem.id, confidence_delta=-0.01)


# --- reinforce_from_interaction: the high-level matcher -------------------


def _make_interaction(**overrides):
    return record_interaction(
        prompt=overrides.get("prompt", "ignored"),
        response=overrides.get("response", ""),
        response_summary=overrides.get("response_summary", ""),
        project=overrides.get("project", ""),
        client=overrides.get("client", ""),
        session_id=overrides.get("session_id", ""),
        reinforce=False,  # the matcher is tested in isolation here
    )


def test_reinforce_from_interaction_matches_active_memory(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="prefers tests that describe behaviour in plain English",
        confidence=0.5,
    )
    interaction = _make_interaction(
        response=(
            "I wrote the new tests in plain English, since the project "
            "prefers tests that describe behaviour in plain English and "
            "that makes them easier to review."
        ),
    )
    results = reinforce_from_interaction(interaction)
    assert len(results) == 1
    assert results[0].memory_id == mem.id
    assert abs(results[0].new_confidence - (0.5 + DEFAULT_CONFIDENCE_DELTA)) < 1e-9


def test_reinforce_from_interaction_ignores_candidates_and_inactive(tmp_data_dir):
    init_db()
    candidate = create_memory(
        memory_type="knowledge",
        content="the polisher frame uses kinematic mounts for thermal isolation",
        confidence=0.6,
        status="candidate",
    )
    interaction = _make_interaction(
        response=(
            "The polisher frame uses kinematic mounts for thermal isolation, "
            "which matches the note in the design log."
        ),
    )
    results = reinforce_from_interaction(interaction)
    # Candidate should NOT be reinforced even though the text matches
    assert all(r.memory_id != candidate.id for r in results)


def test_reinforce_from_interaction_requires_min_content_length(tmp_data_dir):
    init_db()
    short_mem = create_memory(
        memory_type="preference",
        content="uses SI",  # below min length
    )
    interaction = _make_interaction(
        response="Everything uses SI for this project, consistently.",
    )
    results = reinforce_from_interaction(interaction)
    assert all(r.memory_id != short_mem.id for r in results)


def test_reinforce_from_interaction_empty_response_is_noop(tmp_data_dir):
    init_db()
    create_memory(memory_type="preference", content="prefers structured logging")
    interaction = _make_interaction(response="", response_summary="")
    results = reinforce_from_interaction(interaction)
    assert results == []


def test_reinforce_from_interaction_is_normalized(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="Prefers concise commit messages focused on the why",
    )
    # Response has different casing and extra whitespace — should still match
    interaction = _make_interaction(
        response=(
            "The commit message was short on purpose — the user\n\n"
            "PREFERS concise commit MESSAGES   focused on the WHY, "
            "so I stuck to one sentence."
        ),
    )
    results = reinforce_from_interaction(interaction)
    assert any(r.memory_id == mem.id for r in results)


def test_reinforce_from_interaction_deduplicates_across_buckets(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="identity",
        content="mechanical engineer who runs AtoCore",
        project="",
    )
    # This memory belongs to the identity bucket AND would also be
    # fetched via the project query if project matched. We want to ensure
    # we don't double-reinforce.
    interaction = _make_interaction(
        response="The mechanical engineer who runs AtoCore asked for this patch.",
        project="p05-interferometer",
    )
    results = reinforce_from_interaction(interaction)
    assert sum(1 for r in results if r.memory_id == mem.id) == 1


# --- automatic reinforcement on record_interaction ------------------------


def test_record_interaction_auto_reinforces_by_default(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="writes tests before hooking features into API routes",
        confidence=0.5,
    )
    record_interaction(
        prompt="please add the /foo endpoint with tests",
        response=(
            "Wrote tests first, then added the /foo endpoint. The project "
            "writes tests before hooking features into API routes so the "
            "order is enforced."
        ),
    )
    reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]
    assert reloaded.confidence > 0.5
    assert reloaded.reference_count == 1


def test_record_interaction_reinforce_false_skips_pass(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="always includes a rollback note in risky commits",
        confidence=0.5,
    )
    record_interaction(
        prompt="ignored",
        response=(
            "I always includes a rollback note in risky commits, so the "
            "commit message mentions how to revert if needed."
        ),
        reinforce=False,
    )
    reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]
    assert reloaded.confidence == 0.5
    assert reloaded.reference_count == 0


def test_record_interaction_auto_reinforce_handles_empty_response(tmp_data_dir):
    init_db()
    mem = create_memory(memory_type="preference", content="prefers descriptive branch names")
    # No response text — reinforcement should be a silent no-op
    record_interaction(prompt="hi", response="", response_summary="")
    reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]
    assert reloaded.reference_count == 0


# --- API level ------------------------------------------------------------


def test_api_reinforce_endpoint_runs_against_stored_interaction(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="rejects commits that touch credential files",
        confidence=0.5,
    )
    interaction = record_interaction(
        prompt="review commit",
        response=(
            "I rejects commits that touch credential files on sight. "
            "That commit touched ~/.git-credentials, so it was blocked."
        ),
        reinforce=False,  # leave untouched for the endpoint to do it
    )

    client = TestClient(app)
    response = client.post(f"/interactions/{interaction.id}/reinforce")
    assert response.status_code == 200
    body = response.json()
    assert body["interaction_id"] == interaction.id
    assert body["reinforced_count"] >= 1
    ids = [r["memory_id"] for r in body["reinforced"]]
    assert mem.id in ids


def test_api_reinforce_endpoint_returns_404_for_missing(tmp_data_dir):
    init_db()
    client = TestClient(app)
    response = client.post("/interactions/does-not-exist/reinforce")
    assert response.status_code == 404


def test_api_post_interactions_accepts_reinforce_false(tmp_data_dir):
    init_db()
    mem = create_memory(
        memory_type="preference",
        content="writes runbooks alongside new services",
        confidence=0.5,
    )
    client = TestClient(app)
    response = client.post(
        "/interactions",
        json={
            "prompt": "review",
            "response": (
                "I writes runbooks alongside new services and the diff includes "
                "one under docs/runbooks/."
            ),
            "reinforce": False,
        },
    )
    assert response.status_code == 200
    reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]
    assert reloaded.confidence == 0.5
    assert reloaded.reference_count == 0
feat(phase9-B): reinforce active memories from captured interactions Phase 9 Commit B from the agreed plan. With Commit A capturing what AtoCore fed to the LLM and what came back, this commit closes the weakest part of the loop: when a memory is actually referenced in a response, its confidence should drift up, and stale memories that nobody ever mentions should stay where they are. This is reinforcement only — nothing is promoted into trusted state and no candidates are created. Extraction is Commit C. Schema (additive migration): - memories.last_referenced_at DATETIME (null by default) - memories.reference_count INTEGER DEFAULT 0 - idx_memories_last_referenced on last_referenced_at - memories.status now accepts the new "candidate" value so Commit C has the status slot to land on. Existing active/superseded/invalid rows are untouched. New module: src/atocore/memory/reinforcement.py - reinforce_from_interaction(interaction): scans the interaction's response + response_summary for echoes of active memories and bumps confidence / reference_count for each match - matching is intentionally simple and explainable: * normalize both sides (lowercase, collapse whitespace) * require >= 12 chars of memory content to match * compare the leading 80-char window of each memory - the candidate pool is project-scoped memories for the interaction's project + global identity + preference memories, deduplicated - candidates and invalidated memories are NEVER reinforced; only active memories move Memory service changes: - MEMORY_STATUSES = ["candidate", "active", "superseded", "invalid"] - create_memory(status="candidate"\|"active"\|...) with per-status duplicate scoping so a candidate and an active with identical text can legitimately coexist during review - get_memories(status=...) explicit override of the legacy active_only flag; callers can now list the review queue cleanly - update_memory accepts any valid status including "candidate" - reinforce_memory(id, delta): low-level primitive that bumps confidence (capped at 1.0), increments reference_count, and sets last_referenced_at. Only active memories; returns (applied, old, new) - promote_memory / reject_candidate_memory helpers prepping Commit C Interactions service: - record_interaction(reinforce=True) runs reinforce_from_interaction automatically when the interaction has response content. reinforcement errors are logged but never raised back to the caller so capture itself is never blocked by a flaky downstream. - circular import between interactions service and memory.reinforcement avoided by lazy import inside the function API: - POST /interactions now accepts a reinforce bool field (default true) - POST /interactions/{id}/reinforce runs reinforcement on an existing captured interaction — useful for backfilling or for retrying after a transient error in the automatic pass - response lists which memory ids were reinforced with old / new confidence for audit Tests (17 new, all green): - reinforce_memory bumps, caps at 1.0, accumulates reference_count - reinforce_memory rejects candidates and missing ids - reinforce_memory rejects negative delta - reinforce_from_interaction matches active memory - reinforce_from_interaction ignores candidates and inactive - reinforce_from_interaction requires minimum content length - reinforce_from_interaction handles empty response cleanly - reinforce_from_interaction normalizes casing and whitespace - reinforce_from_interaction deduplicates across memory buckets - record_interaction auto-reinforces by default - record_interaction reinforce=False skips the pass - record_interaction handles empty response - POST /interactions/{id}/reinforce runs against stored interaction - POST /interactions/{id}/reinforce returns 404 for missing id - POST /interactions accepts reinforce=false Full suite: 135 passing (was 118). Trust model unchanged: - reinforcement only moves confidence within the existing active set - the candidate lifecycle is declared but only Commit C will actually create candidate memories - trusted project state is never touched by reinforcement Next: Commit C adds the rule-based extractor that produces candidate memories from captured interactions plus the promote/reject review queue endpoints. 2026-04-06 21:18:38 -04:00			`"""Tests for Phase 9 Commit B reinforcement loop."""`

			`from fastapi.testclient import TestClient`

			`from atocore.interactions.service import record_interaction`
			`from atocore.main import app`
			`from atocore.memory.reinforcement import (`
			`DEFAULT_CONFIDENCE_DELTA,`
			`reinforce_from_interaction,`
			`)`
			`from atocore.memory.service import (`
			`create_memory,`
			`get_memories,`
			`reinforce_memory,`
			`)`
			`from atocore.models.database import init_db`


			`# --- service-level tests: reinforce_memory primitive ----------------------`


			`def test_reinforce_memory_bumps_active_memory(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="prefers Python over Ruby for scripting",`
			`confidence=0.6,`
			`)`

			`applied, old_conf, new_conf = reinforce_memory(mem.id, confidence_delta=0.05)`

			`assert applied is True`
			`assert old_conf == 0.6`
			`assert abs(new_conf - 0.65) < 1e-9`

			`reloaded = get_memories(memory_type="preference", limit=10)`
			`match = next((m for m in reloaded if m.id == mem.id), None)`
			`assert match is not None`
			`assert abs(match.confidence - 0.65) < 1e-9`
			`assert match.reference_count == 1`
			`assert match.last_referenced_at # non-empty`


			`def test_reinforce_memory_caps_at_one(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="identity",`
			`content="is a mechanical engineer who runs AtoCore",`
			`confidence=0.98,`
			`)`
			`applied, old_conf, new_conf = reinforce_memory(mem.id, confidence_delta=0.05)`
			`assert applied is True`
			`assert old_conf == 0.98`
			`assert new_conf == 1.0`


			`def test_reinforce_memory_rejects_candidate_and_missing(tmp_data_dir):`
			`init_db()`
			`candidate = create_memory(`
			`memory_type="knowledge",`
			`content="the lateral support uses GF-PTFE pads",`
			`confidence=0.5,`
			`status="candidate",`
			`)`
			`applied, _, _ = reinforce_memory(candidate.id)`
			`assert applied is False`

			`missing, _, _ = reinforce_memory("no-such-id")`
			`assert missing is False`


			`def test_reinforce_memory_accumulates_reference_count(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="likes concise code reviews that focus on the why",`
			`confidence=0.5,`
			`)`
			`for _ in range(5):`
			`reinforce_memory(mem.id, confidence_delta=0.01)`
			`reloaded = [m for m in get_memories(memory_type="preference", limit=10) if m.id == mem.id][0]`
			`assert reloaded.reference_count == 5`
			`assert abs(reloaded.confidence - 0.55) < 1e-9`


			`def test_reinforce_memory_rejects_negative_delta(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(memory_type="preference", content="always uses structured logging")`
			`import pytest`

			`with pytest.raises(ValueError):`
			`reinforce_memory(mem.id, confidence_delta=-0.01)`


			`# --- reinforce_from_interaction: the high-level matcher -------------------`


			`def _make_interaction(**overrides):`
			`return record_interaction(`
			`prompt=overrides.get("prompt", "ignored"),`
			`response=overrides.get("response", ""),`
			`response_summary=overrides.get("response_summary", ""),`
			`project=overrides.get("project", ""),`
			`client=overrides.get("client", ""),`
			`session_id=overrides.get("session_id", ""),`
			`reinforce=False, # the matcher is tested in isolation here`
			`)`


			`def test_reinforce_from_interaction_matches_active_memory(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="prefers tests that describe behaviour in plain English",`
			`confidence=0.5,`
			`)`
			`interaction = _make_interaction(`
			`response=(`
			`"I wrote the new tests in plain English, since the project "`
			`"prefers tests that describe behaviour in plain English and "`
			`"that makes them easier to review."`
			`),`
			`)`
			`results = reinforce_from_interaction(interaction)`
			`assert len(results) == 1`
			`assert results[0].memory_id == mem.id`
			`assert abs(results[0].new_confidence - (0.5 + DEFAULT_CONFIDENCE_DELTA)) < 1e-9`


			`def test_reinforce_from_interaction_ignores_candidates_and_inactive(tmp_data_dir):`
			`init_db()`
			`candidate = create_memory(`
			`memory_type="knowledge",`
			`content="the polisher frame uses kinematic mounts for thermal isolation",`
			`confidence=0.6,`
			`status="candidate",`
			`)`
			`interaction = _make_interaction(`
			`response=(`
			`"The polisher frame uses kinematic mounts for thermal isolation, "`
			`"which matches the note in the design log."`
			`),`
			`)`
			`results = reinforce_from_interaction(interaction)`
			`# Candidate should NOT be reinforced even though the text matches`
			`assert all(r.memory_id != candidate.id for r in results)`


			`def test_reinforce_from_interaction_requires_min_content_length(tmp_data_dir):`
			`init_db()`
			`short_mem = create_memory(`
			`memory_type="preference",`
			`content="uses SI", # below min length`
			`)`
			`interaction = _make_interaction(`
			`response="Everything uses SI for this project, consistently.",`
			`)`
			`results = reinforce_from_interaction(interaction)`
			`assert all(r.memory_id != short_mem.id for r in results)`


			`def test_reinforce_from_interaction_empty_response_is_noop(tmp_data_dir):`
			`init_db()`
			`create_memory(memory_type="preference", content="prefers structured logging")`
			`interaction = _make_interaction(response="", response_summary="")`
			`results = reinforce_from_interaction(interaction)`
			`assert results == []`


			`def test_reinforce_from_interaction_is_normalized(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="Prefers concise commit messages focused on the why",`
			`)`
			`# Response has different casing and extra whitespace — should still match`
			`interaction = _make_interaction(`
			`response=(`
			`"The commit message was short on purpose — the user\n\n"`
			`"PREFERS concise commit MESSAGES focused on the WHY, "`
			`"so I stuck to one sentence."`
			`),`
			`)`
			`results = reinforce_from_interaction(interaction)`
			`assert any(r.memory_id == mem.id for r in results)`


			`def test_reinforce_from_interaction_deduplicates_across_buckets(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="identity",`
			`content="mechanical engineer who runs AtoCore",`
			`project="",`
			`)`
			`# This memory belongs to the identity bucket AND would also be`
			`# fetched via the project query if project matched. We want to ensure`
			`# we don't double-reinforce.`
			`interaction = _make_interaction(`
			`response="The mechanical engineer who runs AtoCore asked for this patch.",`
			`project="p05-interferometer",`
			`)`
			`results = reinforce_from_interaction(interaction)`
			`assert sum(1 for r in results if r.memory_id == mem.id) == 1`


			`# --- automatic reinforcement on record_interaction ------------------------`


			`def test_record_interaction_auto_reinforces_by_default(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="writes tests before hooking features into API routes",`
			`confidence=0.5,`
			`)`
			`record_interaction(`
			`prompt="please add the /foo endpoint with tests",`
			`response=(`
			`"Wrote tests first, then added the /foo endpoint. The project "`
			`"writes tests before hooking features into API routes so the "`
			`"order is enforced."`
			`),`
			`)`
			`reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]`
			`assert reloaded.confidence > 0.5`
			`assert reloaded.reference_count == 1`


			`def test_record_interaction_reinforce_false_skips_pass(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="always includes a rollback note in risky commits",`
			`confidence=0.5,`
			`)`
			`record_interaction(`
			`prompt="ignored",`
			`response=(`
			`"I always includes a rollback note in risky commits, so the "`
			`"commit message mentions how to revert if needed."`
			`),`
			`reinforce=False,`
			`)`
			`reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]`
			`assert reloaded.confidence == 0.5`
			`assert reloaded.reference_count == 0`


			`def test_record_interaction_auto_reinforce_handles_empty_response(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(memory_type="preference", content="prefers descriptive branch names")`
			`# No response text — reinforcement should be a silent no-op`
			`record_interaction(prompt="hi", response="", response_summary="")`
			`reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]`
			`assert reloaded.reference_count == 0`


			`# --- API level ------------------------------------------------------------`


			`def test_api_reinforce_endpoint_runs_against_stored_interaction(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="rejects commits that touch credential files",`
			`confidence=0.5,`
			`)`
			`interaction = record_interaction(`
			`prompt="review commit",`
			`response=(`
			`"I rejects commits that touch credential files on sight. "`
			`"That commit touched ~/.git-credentials, so it was blocked."`
			`),`
			`reinforce=False, # leave untouched for the endpoint to do it`
			`)`

			`client = TestClient(app)`
			`response = client.post(f"/interactions/{interaction.id}/reinforce")`
			`assert response.status_code == 200`
			`body = response.json()`
			`assert body["interaction_id"] == interaction.id`
			`assert body["reinforced_count"] >= 1`
			`ids = [r["memory_id"] for r in body["reinforced"]]`
			`assert mem.id in ids`


			`def test_api_reinforce_endpoint_returns_404_for_missing(tmp_data_dir):`
			`init_db()`
			`client = TestClient(app)`
			`response = client.post("/interactions/does-not-exist/reinforce")`
			`assert response.status_code == 404`


			`def test_api_post_interactions_accepts_reinforce_false(tmp_data_dir):`
			`init_db()`
			`mem = create_memory(`
			`memory_type="preference",`
			`content="writes runbooks alongside new services",`
			`confidence=0.5,`
			`)`
			`client = TestClient(app)`
			`response = client.post(`
			`"/interactions",`
			`json={`
			`"prompt": "review",`
			`"response": (`
			`"I writes runbooks alongside new services and the diff includes "`
			`"one under docs/runbooks/."`
			`),`
			`"reinforce": False,`
			`},`
			`)`
			`assert response.status_code == 200`
			`reloaded = [m for m in get_memories(memory_type="preference", limit=20) if m.id == mem.id][0]`
			`assert reloaded.confidence == 0.5`
			`assert reloaded.reference_count == 0`