Three changes that get PR #150 to a green CI gate: 1. **test_record_decision_persists_and_bumps_state_version** — the `decision: draft_template` path calls `_extract_template_parameters` (TemplateExtractionService → AI provider). CI doesn't set ANTHROPIC_API_KEY/GOOGLE_AI_API_KEY, so the endpoint raised `RuntimeError: No AI provider configured` and returned 500. The test isn't exercising the AI integration — patched the extractor with an AsyncMock returning a minimal valid `{templated_body, parameters}` dict. Verified locally: the test now passes. 2. **pip + npm caches** in backend, frontend, and e2e jobs. Keyed on the hash of requirements*.txt / package-lock.json with a runner-os restore-key fallback. Saves ~30-60s per run on cache hit. 3. **Pytest invocation tightened**: - Dropped `--cov-report=term-missing` — the custom "Display coverage summary" step below parses coverage.json and prints the same module list more concisely. Term-missing dumps every uncovered line which adds ~5-10s of stdout. - Added `--maxfail=10` so a structural breakage (fixture explosion, DB unreachable) bails after 10 errors instead of running the full 25-min suite. Tunable. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
370 lines
13 KiB
Python
370 lines
13 KiB
Python
"""API + service tests for the FlowPilot Phase 3 suggested-fix + preview surface.
|
|
|
|
Covers:
|
|
- /api/v1/ai-sessions/{id}/suggested-fixes/active (200 + 404)
|
|
- /api/v1/ai-sessions/{id}/suggested-fixes/{fix_id}/decision (one_off,
|
|
draft_template, build_template, dismissed; 409 on dismissing a superseded
|
|
fix; state_version bump)
|
|
- /api/v1/ai-sessions/{id}/resolution-note/preview (LLM mocked; cache hit on
|
|
same state_version, miss after a fact write)
|
|
- [SUGGEST_FIX] marker parser shape
|
|
- _persist_suggested_fix supersession + state_version bump
|
|
"""
|
|
from __future__ import annotations
|
|
|
|
import uuid
|
|
from datetime import datetime, timezone
|
|
from unittest.mock import AsyncMock, patch
|
|
|
|
import pytest
|
|
from httpx import AsyncClient
|
|
from sqlalchemy import select
|
|
|
|
from app.api.endpoints.session_suggested_fixes import _clear_preview_cache_for_tests
|
|
from app.models.ai_session import AISession
|
|
from app.models.session_suggested_fix import SessionSuggestedFix
|
|
from app.services.unified_chat_service import (
|
|
_parse_suggest_fix_marker,
|
|
_persist_suggested_fix,
|
|
)
|
|
|
|
|
|
@pytest.fixture(autouse=True)
|
|
def _isolate_preview_cache():
|
|
_clear_preview_cache_for_tests()
|
|
yield
|
|
_clear_preview_cache_for_tests()
|
|
|
|
|
|
async def _make_session(test_db, user) -> AISession:
|
|
session = AISession(
|
|
user_id=user["user_data"]["id"],
|
|
account_id=user["user_data"]["account_id"],
|
|
session_type="chat",
|
|
intake_type="free_text",
|
|
intake_content={"text": "phase 3 test"},
|
|
status="active",
|
|
confidence_tier="discovery",
|
|
conversation_messages=[],
|
|
)
|
|
test_db.add(session)
|
|
await test_db.commit()
|
|
await test_db.refresh(session)
|
|
return session
|
|
|
|
|
|
# ── [SUGGEST_FIX] parser ────────────────────────────────────────────────────
|
|
|
|
class TestSuggestFixParser:
|
|
def test_no_marker(self):
|
|
cleaned, fix = _parse_suggest_fix_marker("just analysis")
|
|
assert cleaned == "just analysis"
|
|
assert fix is None
|
|
|
|
def test_well_formed_block(self):
|
|
text = (
|
|
"Analysis sentence.\n\n"
|
|
'[SUGGEST_FIX]\n'
|
|
'{"title": "Reset password", "description": "Stale credential.", '
|
|
'"confidence": 87, "script_template_slug": "reset-cw"}\n'
|
|
'[/SUGGEST_FIX]'
|
|
)
|
|
cleaned, fix = _parse_suggest_fix_marker(text)
|
|
assert cleaned == "Analysis sentence."
|
|
assert fix is not None
|
|
assert fix["title"] == "Reset password"
|
|
assert fix["confidence_pct"] == 87
|
|
assert fix["script_template_slug"] == "reset-cw"
|
|
assert fix["ai_drafted_script"] is None
|
|
|
|
def test_confidence_clamped_and_rounded(self):
|
|
text = (
|
|
'[SUGGEST_FIX]\n{"title":"x","description":"y","confidence":120.7}\n[/SUGGEST_FIX]'
|
|
)
|
|
_, fix = _parse_suggest_fix_marker(text)
|
|
assert fix is not None and fix["confidence_pct"] == 100
|
|
|
|
text2 = (
|
|
'[SUGGEST_FIX]\n{"title":"x","description":"y","confidence":-3}\n[/SUGGEST_FIX]'
|
|
)
|
|
_, fix2 = _parse_suggest_fix_marker(text2)
|
|
assert fix2 is not None and fix2["confidence_pct"] == 0
|
|
|
|
def test_only_last_block_wins(self):
|
|
# Stale early block plus a final intent — the parser keeps the LAST one.
|
|
text = (
|
|
'[SUGGEST_FIX]\n{"title":"old","description":"o","confidence":50}\n[/SUGGEST_FIX]\n'
|
|
'[SUGGEST_FIX]\n{"title":"new","description":"n","confidence":80}\n[/SUGGEST_FIX]'
|
|
)
|
|
cleaned, fix = _parse_suggest_fix_marker(text)
|
|
assert fix is not None and fix["title"] == "new"
|
|
assert "[SUGGEST_FIX]" not in cleaned
|
|
|
|
def test_missing_required_field_dropped(self):
|
|
text = '[SUGGEST_FIX]\n{"title":"only title"}\n[/SUGGEST_FIX]'
|
|
cleaned, fix = _parse_suggest_fix_marker(text)
|
|
assert fix is None
|
|
# Marker still stripped from display.
|
|
assert "[SUGGEST_FIX]" not in cleaned
|
|
|
|
def test_malformed_json_dropped(self):
|
|
text = "[SUGGEST_FIX]\nnot json\n[/SUGGEST_FIX]"
|
|
cleaned, fix = _parse_suggest_fix_marker(text)
|
|
assert fix is None
|
|
assert "[SUGGEST_FIX]" not in cleaned
|
|
|
|
|
|
# ── _persist_suggested_fix ──────────────────────────────────────────────────
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_persist_supersedes_prior_active_and_bumps_state_version(test_db, test_user):
|
|
session = await _make_session(test_db, test_user)
|
|
initial_version = session.state_version
|
|
|
|
# Insert an existing active fix so we can verify supersession.
|
|
existing = SessionSuggestedFix(
|
|
session_id=session.id,
|
|
account_id=session.account_id,
|
|
title="Old fix",
|
|
description="prior",
|
|
confidence_pct=60,
|
|
)
|
|
test_db.add(existing)
|
|
await test_db.commit()
|
|
|
|
await _persist_suggested_fix(
|
|
db=test_db,
|
|
session=session,
|
|
fix={
|
|
"title": "New fix",
|
|
"description": "current best",
|
|
"confidence_pct": 88,
|
|
"script_template_slug": None,
|
|
"ai_drafted_script": None,
|
|
"ai_drafted_parameters": None,
|
|
},
|
|
)
|
|
await test_db.commit()
|
|
await test_db.refresh(existing)
|
|
await test_db.refresh(session)
|
|
|
|
assert existing.superseded_at is not None
|
|
assert session.state_version == initial_version + 1
|
|
|
|
# Exactly one active row remains — and it's the new one.
|
|
result = await test_db.execute(
|
|
select(SessionSuggestedFix).where(
|
|
SessionSuggestedFix.session_id == session.id,
|
|
SessionSuggestedFix.superseded_at.is_(None),
|
|
)
|
|
)
|
|
actives = list(result.scalars().all())
|
|
assert len(actives) == 1
|
|
assert actives[0].title == "New fix"
|
|
|
|
|
|
# ── /suggested-fixes/active endpoint ────────────────────────────────────────
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_get_active_returns_404_when_none(client: AsyncClient, test_user, auth_headers, test_db):
|
|
session = await _make_session(test_db, test_user)
|
|
r = await client.get(
|
|
f"/api/v1/ai-sessions/{session.id}/suggested-fixes/active",
|
|
headers=auth_headers,
|
|
)
|
|
assert r.status_code == 404
|
|
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_get_active_returns_active_fix(client: AsyncClient, test_user, auth_headers, test_db):
|
|
session = await _make_session(test_db, test_user)
|
|
fix = SessionSuggestedFix(
|
|
session_id=session.id,
|
|
account_id=session.account_id,
|
|
title="Active fix",
|
|
description="d",
|
|
confidence_pct=72,
|
|
)
|
|
test_db.add(fix)
|
|
await test_db.commit()
|
|
|
|
r = await client.get(
|
|
f"/api/v1/ai-sessions/{session.id}/suggested-fixes/active",
|
|
headers=auth_headers,
|
|
)
|
|
assert r.status_code == 200
|
|
body = r.json()
|
|
assert body["title"] == "Active fix"
|
|
assert body["confidence_pct"] == 72
|
|
assert body["superseded_at"] is None
|
|
|
|
|
|
# ── /decision endpoint ─────────────────────────────────────────────────────
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_record_decision_persists_and_bumps_state_version(
|
|
client: AsyncClient, test_user, auth_headers, test_db
|
|
):
|
|
session = await _make_session(test_db, test_user)
|
|
initial_version = session.state_version
|
|
fix = SessionSuggestedFix(
|
|
session_id=session.id,
|
|
account_id=session.account_id,
|
|
title="x",
|
|
description="y",
|
|
confidence_pct=50,
|
|
ai_drafted_script="Write-Output 'ok'",
|
|
)
|
|
test_db.add(fix)
|
|
await test_db.commit()
|
|
|
|
# The draft_template path calls TemplateExtractionService, which needs an
|
|
# AI provider configured. CI doesn't set ANTHROPIC_API_KEY/GOOGLE_AI_API_KEY,
|
|
# and this test isn't exercising the AI integration — patch the extractor
|
|
# with a minimal valid response so the rest of the decision flow runs.
|
|
extractor_stub = AsyncMock(return_value={
|
|
"templated_body": "Write-Output 'ok'",
|
|
"parameters": [],
|
|
})
|
|
with patch(
|
|
"app.api.endpoints.session_suggested_fixes._extract_template_parameters",
|
|
extractor_stub,
|
|
):
|
|
r = await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/suggested-fixes/{fix.id}/decision",
|
|
headers=auth_headers,
|
|
json={"decision": "draft_template"},
|
|
)
|
|
assert r.status_code == 200
|
|
assert r.json()["user_decision"] == "draft_template"
|
|
|
|
await test_db.refresh(session)
|
|
assert session.state_version == initial_version + 1
|
|
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_dismissed_supersedes_the_fix(
|
|
client: AsyncClient, test_user, auth_headers, test_db
|
|
):
|
|
session = await _make_session(test_db, test_user)
|
|
fix = SessionSuggestedFix(
|
|
session_id=session.id,
|
|
account_id=session.account_id,
|
|
title="x",
|
|
description="y",
|
|
confidence_pct=50,
|
|
)
|
|
test_db.add(fix)
|
|
await test_db.commit()
|
|
|
|
r = await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/suggested-fixes/{fix.id}/decision",
|
|
headers=auth_headers,
|
|
json={"decision": "dismissed"},
|
|
)
|
|
assert r.status_code == 200
|
|
await test_db.refresh(fix)
|
|
assert fix.superseded_at is not None
|
|
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_dismiss_already_superseded_returns_409(
|
|
client: AsyncClient, test_user, auth_headers, test_db
|
|
):
|
|
session = await _make_session(test_db, test_user)
|
|
fix = SessionSuggestedFix(
|
|
session_id=session.id,
|
|
account_id=session.account_id,
|
|
title="x",
|
|
description="y",
|
|
confidence_pct=50,
|
|
superseded_at=datetime.now(timezone.utc),
|
|
)
|
|
test_db.add(fix)
|
|
await test_db.commit()
|
|
|
|
r = await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/suggested-fixes/{fix.id}/decision",
|
|
headers=auth_headers,
|
|
json={"decision": "dismissed"},
|
|
)
|
|
assert r.status_code == 409
|
|
|
|
|
|
# ── /resolution-note/preview endpoint ──────────────────────────────────────
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_preview_uses_state_version_cache(
|
|
client: AsyncClient, test_user, auth_headers, test_db
|
|
):
|
|
session = await _make_session(test_db, test_user)
|
|
|
|
fake_provider = AsyncMock()
|
|
fake_provider.generate_text = AsyncMock(return_value=(
|
|
"## Problem\nx\n\n## What we confirmed\n(none)\n\n## Root cause\ny\n\n## Resolution\nz",
|
|
100, 50,
|
|
))
|
|
|
|
with patch(
|
|
"app.services.resolution_note_generator.get_ai_provider",
|
|
return_value=fake_provider,
|
|
):
|
|
# First call — cache miss, generates fresh.
|
|
r1 = await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/resolution-note/preview",
|
|
headers=auth_headers,
|
|
)
|
|
assert r1.status_code == 200
|
|
assert r1.json()["from_cache"] is False
|
|
assert fake_provider.generate_text.await_count == 1
|
|
|
|
# Second call, no state change — must hit the cache (no extra LLM call).
|
|
r2 = await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/resolution-note/preview",
|
|
headers=auth_headers,
|
|
)
|
|
assert r2.status_code == 200
|
|
assert r2.json()["from_cache"] is True
|
|
assert r2.json()["markdown"] == r1.json()["markdown"]
|
|
assert fake_provider.generate_text.await_count == 1
|
|
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_preview_invalidates_after_fact_write(
|
|
client: AsyncClient, test_user, auth_headers, test_db
|
|
):
|
|
"""A new fact bumps state_version → next preview is a fresh generation, not cached."""
|
|
session = await _make_session(test_db, test_user)
|
|
|
|
fake_provider = AsyncMock()
|
|
fake_provider.generate_text = AsyncMock(return_value=(
|
|
"## Problem\nx\n\n## What we confirmed\n(none)\n\n## Root cause\ny\n\n## Resolution\nz",
|
|
100, 50,
|
|
))
|
|
|
|
with patch(
|
|
"app.services.resolution_note_generator.get_ai_provider",
|
|
return_value=fake_provider,
|
|
):
|
|
await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/resolution-note/preview",
|
|
headers=auth_headers,
|
|
)
|
|
assert fake_provider.generate_text.await_count == 1
|
|
|
|
# Add a fact — bumps state_version on the session.
|
|
await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/facts",
|
|
headers=auth_headers,
|
|
json={"text": "a confirmed observation"},
|
|
)
|
|
|
|
# Next preview must regenerate (cache key includes state_version).
|
|
r = await client.post(
|
|
f"/api/v1/ai-sessions/{session.id}/resolution-note/preview",
|
|
headers=auth_headers,
|
|
)
|
|
assert r.status_code == 200
|
|
assert r.json()["from_cache"] is False
|
|
assert fake_provider.generate_text.await_count == 2
|