test(gameplay): add canonical loop smoke evidence (#302)
Some checks failed
CI / test-and-quality (push) Failing after 3m42s
CI / test-and-quality (pull_request) Successful in 3m36s

This commit is contained in:
2026-03-16 15:20:06 +00:00
parent 112a85a22d
commit 9970257f32
4 changed files with 434 additions and 87 deletions

View File

@@ -0,0 +1,55 @@
# Issue #302 Evidence — canonical bluff → guess → reveal → scoreboard regression
## Runnable command
```bash
python manage.py migrate --noinput
python manage.py smoke_staging --artifact docs/artifacts/issue-302-canonical-loop-smoke.json
```
`migrate` is the normal local bootstrap precondition when the database has not been initialized yet; the regression evidence itself is produced by `smoke_staging`.
## What the regression proves
`smoke_staging` now exercises one full canonical round and fails fast with step-specific diagnostics if any of these break:
1. `start_round` lands the session in `lie` and returns a concrete `round_question_id`.
2. Final `submit_lie` auto-advances the session to `guess` and exposes mixed answers containing both the correct answer and player bluffs.
3. Final `submit_guess` auto-advances the session to `reveal` and returns the canonical reveal payload.
4. The reveal payload includes:
- correct answer
- all lies
- all guesses
- fooled-player references for bluff hits
5. The first canonical state read after reveal promotes the session to `scoreboard`.
6. Scoreboard promotion preserves the same reveal payload and exposes a leaderboard with `scoreboard_ready=true`.
## Artifact shape
When `--artifact` is provided, the JSON file records:
- the exact smoke command
- session code and round question id
- deterministic guess plan used to produce both bluff hits and one correct guess
- per-step evidence for:
- `create_session`
- `join_players`
- `start_round`
- `auto_guess_transition`
- `submit_guesses`
- `auto_reveal_transition`
- `auto_scoreboard_transition`
- `finish_game`
- reveal summary (`correct_answer`, lie/guess counts, fooled-player ids, correct guess player ids)
- promoted scoreboard leaderboard payload
## Targeted test coverage
Backend regression coverage lives in `lobby/tests.py`:
- `test_smoke_staging_command_runs_full_flow`
- `test_smoke_staging_writes_phase_evidence_artifact_when_requested`
Together they ensure the command stays runnable in normal workflow and that the evidence artifact contains phase-by-phase proof instead of only a generic pass/fail.
Refs #287 #302

View File

@@ -0,0 +1,110 @@
{
"ok": true,
"command": "python manage.py smoke_staging --artifact <path>",
"generated_at": "2026-03-16T15:19:30.105231+00:00",
"question": {
"prompt": "Smoke prompt?",
"correct_answer": "Correct"
},
"steps": [
{
"step": "create_session",
"session_status": "lobby"
},
{
"step": "join_players",
"players_count": 3
},
{
"step": "start_round",
"session_status": "lie",
"round_question_id": 1
},
{
"step": "auto_guess_transition",
"session_status": "guess",
"answers": [
"Lie from P3",
"Lie from P1",
"Lie from P2",
"Correct"
]
},
{
"step": "submit_guesses",
"guess_results": [
{
"player_id": 1,
"selected_text": "Lie from P2",
"is_correct": false,
"fooled_player_id": 2
},
{
"player_id": 2,
"selected_text": "Correct",
"is_correct": true,
"fooled_player_id": null
},
{
"player_id": 3,
"selected_text": "Lie from P1",
"is_correct": false,
"fooled_player_id": 1
}
]
},
{
"step": "auto_reveal_transition",
"session_status": "reveal",
"reveal": {
"correct_answer": "Correct",
"lies_count": 3,
"guesses_count": 3,
"fooled_player_ids": [
1,
2
],
"correct_guess_player_ids": [
2
]
}
},
{
"step": "auto_scoreboard_transition",
"session_status": "scoreboard",
"leaderboard": [
{
"id": 2,
"nickname": "P2",
"score": 7
},
{
"id": 1,
"nickname": "P1",
"score": 2
},
{
"id": 3,
"nickname": "P3",
"score": 0
}
]
},
{
"step": "finish_game",
"session_status": "finished"
}
],
"session_code": "7YV59E",
"players": [
"P1",
"P2",
"P3"
],
"round_question_id": 1,
"guess_plan": {
"P1": "Lie from P2",
"P2": "Correct",
"P3": "Lie from P1"
}
}

View File

@@ -10,7 +10,7 @@ from fupogfakta.models import Category, GameSession, Player, Question, RoundQues
class Command(BaseCommand): class Command(BaseCommand):
help = "Run minimal staging smoke flow for lobby gameplay" help = "Run canonical gameplay smoke/regression flow for bluff -> guess -> reveal -> scoreboard"
def add_arguments(self, parser): def add_arguments(self, parser):
parser.add_argument( parser.add_argument(
@@ -18,6 +18,26 @@ class Command(BaseCommand):
help="Optional path to write smoke result artifact as JSON", help="Optional path to write smoke result artifact as JSON",
) )
def _fail(self, step: str, detail: str, payload=None):
message = f"{step} failed: {detail}"
if payload is not None:
message += f" | payload={json.dumps(payload, sort_keys=True)}"
raise CommandError(message)
def _expect_status(self, response, expected_status: int, step: str):
if response.status_code != expected_status:
try:
payload = response.json()
except ValueError:
payload = {"raw": response.content.decode("utf-8", errors="replace")}
self._fail(step, f"expected HTTP {expected_status}, got {response.status_code}", payload)
return response.json()
def _expect_session_status(self, payload: dict, expected_status: str, step: str):
actual_status = payload.get("session", {}).get("status")
if actual_status != expected_status:
self._fail(step, f"expected session.status={expected_status}, got {actual_status}", payload)
def handle(self, *args, **options): def handle(self, *args, **options):
GameSession.objects.all().delete() GameSession.objects.all().delete()
Player.objects.all().delete() Player.objects.all().delete()
@@ -30,11 +50,14 @@ class Command(BaseCommand):
category.is_active = True category.is_active = True
category.save(update_fields=["is_active"]) category.save(update_fields=["is_active"])
Question.objects.get_or_create( question, _ = Question.objects.get_or_create(
category=category, category=category,
prompt="Smoke prompt?", prompt="Smoke prompt?",
defaults={"correct_answer": "Correct", "is_active": True}, defaults={"correct_answer": "Correct", "is_active": True},
) )
if not question.is_active:
question.is_active = True
question.save(update_fields=["is_active"])
User = get_user_model() User = get_user_model()
host, _ = User.objects.get_or_create(username="smoke-host") host, _ = User.objects.get_or_create(username="smoke-host")
@@ -42,111 +65,254 @@ class Command(BaseCommand):
host.is_staff = True host.is_staff = True
host.save() host.save()
artifact = {
"ok": True,
"command": "python manage.py smoke_staging --artifact <path>",
"generated_at": datetime.now(timezone.utc).isoformat(),
"question": {
"prompt": question.prompt,
"correct_answer": question.correct_answer,
},
"steps": [],
}
host_client = Client() host_client = Client()
host_client.force_login(host) host_client.force_login(host)
create_res = host_client.post("/lobby/sessions/create", content_type="application/json") create_payload = self._expect_status(
if create_res.status_code != 201: host_client.post("/lobby/sessions/create", content_type="application/json"),
raise CommandError(f"create_session failed: {create_res.status_code} {create_res.content!r}") 201,
"create_session",
code = create_res.json()["session"]["code"] )
code = create_payload["session"]["code"]
artifact["session_code"] = code
artifact["steps"].append(
{
"step": "create_session",
"session_status": create_payload["session"]["status"],
}
)
players = [] players = []
for nickname in ["P1", "P2", "P3"]: for nickname in ["P1", "P2", "P3"]:
join_res = Client().post( join_payload = self._expect_status(
"/lobby/sessions/join", Client().post(
data=json.dumps({"code": code, "nickname": nickname}), "/lobby/sessions/join",
content_type="application/json", data=json.dumps({"code": code, "nickname": nickname}),
content_type="application/json",
),
201,
f"join_session[{nickname}]",
) )
if join_res.status_code != 201: players.append(join_payload["player"])
raise CommandError(f"join_session failed for {nickname}: {join_res.status_code}") artifact["players"] = [player["nickname"] for player in players]
players.append(join_res.json()["player"]) artifact["steps"].append(
{
start_res = host_client.post( "step": "join_players",
f"/lobby/sessions/{code}/rounds/start", "players_count": len(players),
data=json.dumps({"category_slug": category.slug}), }
content_type="application/json",
) )
if start_res.status_code != 201:
raise CommandError(f"start_round failed: {start_res.status_code}")
round_question_id = start_res.json()["round_question"]["id"] start_payload = self._expect_status(
host_client.post(
f"/lobby/sessions/{code}/rounds/start",
data=json.dumps({"category_slug": category.slug}),
content_type="application/json",
),
201,
"start_round",
)
self._expect_session_status(start_payload, GameSession.Status.LIE, "start_round")
round_question_id = start_payload["round_question"]["id"]
artifact["round_question_id"] = round_question_id
artifact["steps"].append(
{
"step": "start_round",
"session_status": start_payload["session"]["status"],
"round_question_id": round_question_id,
}
)
answers = [] answers = []
lie_transition_payload = None
for player in players: for player in players:
nick = player["nickname"] nickname = player["nickname"]
lie_res = Client().post( lie_payload = self._expect_status(
f"/lobby/sessions/{code}/questions/{round_question_id}/lies/submit", Client().post(
data=json.dumps( f"/lobby/sessions/{code}/questions/{round_question_id}/lies/submit",
{ data=json.dumps(
"player_id": player["id"], {
"session_token": player["session_token"], "player_id": player["id"],
"text": f"Lie from {nick}", "session_token": player["session_token"],
} "text": f"Lie from {nickname}",
}
),
content_type="application/json",
), ),
content_type="application/json", 201,
f"submit_lie[{nickname}]",
) )
if lie_res.status_code != 201: if lie_payload.get("answers"):
raise CommandError(f"submit_lie failed for {nick}: {lie_res.status_code}") answers = lie_payload["answers"]
if lie_res.json().get("answers"): lie_transition_payload = lie_payload
answers = lie_res.json()["answers"]
if not answers: if not answers:
detail_res = host_client.get(f"/lobby/sessions/{code}") detail_payload = self._expect_status(host_client.get(f"/lobby/sessions/{code}"), 200, "session_detail_after_lies")
if detail_res.status_code != 200: answers = detail_payload.get("round_question", {}).get("answers", [])
raise CommandError(f"session_detail after lies failed: {detail_res.status_code}") self._expect_session_status(detail_payload, GameSession.Status.GUESS, "session_detail_after_lies")
answers = detail_res.json().get("round_question", {}).get("answers", []) lie_transition_payload = detail_payload
if not answers: if not answers:
raise CommandError("canonical lie->guess transition returned empty answers") self._fail("auto_guess_transition", "canonical lie->guess transition returned empty answers")
for player in players: if not any(answer.get("text") == question.correct_answer for answer in answers):
nick = player["nickname"] self._fail("auto_guess_transition", "mixed answers missing correct answer", {"answers": answers})
selected = next((a for a in answers if a.get("player_id") != player["id"]), answers[0]) if len(answers) < len(players) + 1:
guess_res = Client().post( self._fail(
f"/lobby/sessions/{code}/questions/{round_question_id}/guesses/submit", "auto_guess_transition",
data=json.dumps( "mixed answers shorter than expected bluff set",
{ {"answers": answers, "players_count": len(players)},
"player_id": player["id"],
"session_token": player["session_token"],
"selected_text": selected["text"],
}
),
content_type="application/json",
) )
if guess_res.status_code != 201:
raise CommandError(f"submit_guess failed for {nick}: {guess_res.status_code}")
detail_res = host_client.get(f"/lobby/sessions/{code}") self._expect_session_status(lie_transition_payload, GameSession.Status.GUESS, "auto_guess_transition")
if detail_res.status_code != 200: artifact["steps"].append(
raise CommandError(f"session_detail after guesses failed: {detail_res.status_code}") {
if detail_res.json()["session"]["status"] != GameSession.Status.SCOREBOARD: "step": "auto_guess_transition",
raise CommandError("canonical guess->reveal->scoreboard transition did not reach scoreboard") "session_status": lie_transition_payload["session"]["status"],
"answers": [answer["text"] for answer in answers],
}
)
finish_res = host_client.post(f"/lobby/sessions/{code}/finish", content_type="application/json") answer_texts = {answer["text"] for answer in answers}
if finish_res.status_code != 200: correct_answer = next((answer["text"] for answer in answers if answer.get("text") == question.correct_answer), None)
raise CommandError(f"finish_game failed: {finish_res.status_code}") if correct_answer is None:
self._fail("submit_guesses", "could not resolve correct answer from mixed answers", {"answers": answers})
guess_plan = {
players[0]["nickname"]: "Lie from P2",
players[1]["nickname"]: correct_answer,
players[2]["nickname"]: "Lie from P1",
}
missing_guess_targets = {text for text in guess_plan.values() if text not in answer_texts}
if missing_guess_targets:
self._fail(
"submit_guesses",
"expected bluff targets missing from mixed answers",
{"answers": answers, "missing_guess_targets": sorted(missing_guess_targets)},
)
artifact["guess_plan"] = guess_plan
guess_payloads = []
for player in players:
nickname = player["nickname"]
guess_payload = self._expect_status(
Client().post(
f"/lobby/sessions/{code}/questions/{round_question_id}/guesses/submit",
data=json.dumps(
{
"player_id": player["id"],
"session_token": player["session_token"],
"selected_text": guess_plan[nickname],
}
),
content_type="application/json",
),
201,
f"submit_guess[{nickname}]",
)
guess_payloads.append(guess_payload)
reveal_payload = guess_payloads[-1]
self._expect_session_status(reveal_payload, GameSession.Status.REVEAL, "auto_reveal_transition")
if not reveal_payload.get("phase_transition", {}).get("auto_advanced"):
self._fail("auto_reveal_transition", "expected auto_advanced=true on final guess", reveal_payload)
reveal = reveal_payload.get("reveal")
if not reveal:
self._fail("auto_reveal_transition", "missing canonical reveal payload", reveal_payload)
if reveal.get("correct_answer") != question.correct_answer:
self._fail(
"auto_reveal_transition",
"reveal payload returned wrong correct answer",
{"expected": question.correct_answer, "reveal": reveal},
)
if len(reveal.get("lies", [])) != len(players):
self._fail("auto_reveal_transition", "unexpected lie count in reveal payload", reveal)
if len(reveal.get("guesses", [])) != len(players):
self._fail("auto_reveal_transition", "unexpected guess count in reveal payload", reveal)
fooled_guesses = [guess for guess in reveal["guesses"] if not guess.get("is_correct")]
correct_guesses = [guess for guess in reveal["guesses"] if guess.get("is_correct")]
if len(fooled_guesses) != 2:
self._fail("auto_reveal_transition", "expected exactly two bluff guesses", reveal)
if len(correct_guesses) != 1:
self._fail("auto_reveal_transition", "expected exactly one correct guess", reveal)
if any(guess.get("fooled_player_id") is None for guess in fooled_guesses):
self._fail("auto_reveal_transition", "bluff guesses missing fooled_player_id", reveal)
artifact["steps"].append(
{
"step": "submit_guesses",
"guess_results": [
{
"player_id": payload["guess"]["player_id"],
"selected_text": payload["guess"]["selected_text"],
"is_correct": payload["guess"]["is_correct"],
"fooled_player_id": payload["guess"].get("fooled_player_id"),
}
for payload in guess_payloads
],
}
)
artifact["steps"].append(
{
"step": "auto_reveal_transition",
"session_status": reveal_payload["session"]["status"],
"reveal": {
"correct_answer": reveal["correct_answer"],
"lies_count": len(reveal["lies"]),
"guesses_count": len(reveal["guesses"]),
"fooled_player_ids": sorted(guess["fooled_player_id"] for guess in fooled_guesses),
"correct_guess_player_ids": sorted(guess["player_id"] for guess in correct_guesses),
},
}
)
detail_payload = self._expect_status(host_client.get(f"/lobby/sessions/{code}"), 200, "session_detail_after_guesses")
self._expect_session_status(detail_payload, GameSession.Status.SCOREBOARD, "auto_scoreboard_transition")
if detail_payload.get("reveal") != reveal:
self._fail("auto_scoreboard_transition", "scoreboard promotion changed canonical reveal payload", detail_payload)
scoreboard = detail_payload.get("scoreboard")
if not scoreboard:
self._fail("auto_scoreboard_transition", "missing scoreboard payload after promotion", detail_payload)
if len(scoreboard) != len(players):
self._fail("auto_scoreboard_transition", "unexpected scoreboard length", detail_payload)
if not detail_payload.get("phase_view_model", {}).get("readiness", {}).get("scoreboard_ready"):
self._fail("auto_scoreboard_transition", "scoreboard_ready=false after promotion", detail_payload)
artifact["steps"].append(
{
"step": "auto_scoreboard_transition",
"session_status": detail_payload["session"]["status"],
"leaderboard": scoreboard,
}
)
finish_payload = self._expect_status(
host_client.post(f"/lobby/sessions/{code}/finish", content_type="application/json"),
200,
"finish_game",
)
self._expect_session_status(finish_payload, GameSession.Status.FINISHED, "finish_game")
artifact["steps"].append(
{
"step": "finish_game",
"session_status": finish_payload["session"]["status"],
}
)
artifact_path = options.get("artifact") artifact_path = options.get("artifact")
if artifact_path: if artifact_path:
artifact = {
"ok": True,
"command": "smoke_staging",
"generated_at": datetime.now(timezone.utc).isoformat(),
"session_code": code,
"players": [player["nickname"] for player in players],
"round_question_id": round_question_id,
"steps": [
"create_session",
"join_players",
"start_round",
"submit_lies",
"auto_guess_transition",
"submit_guesses",
"auto_reveal_to_scoreboard",
"finish_game",
],
}
output_path = Path(artifact_path) output_path = Path(artifact_path)
output_path.parent.mkdir(parents=True, exist_ok=True) output_path.parent.mkdir(parents=True, exist_ok=True)
output_path.write_text(json.dumps(artifact, indent=2) + "\n", encoding="utf-8") output_path.write_text(json.dumps(artifact, indent=2) + "\n", encoding="utf-8")

View File

@@ -1905,7 +1905,7 @@ class SmokeStagingCommandTests(TestCase):
self.assertEqual(session.status, GameSession.Status.FINISHED) self.assertEqual(session.status, GameSession.Status.FINISHED)
self.assertEqual(Player.objects.filter(session=session).count(), 3) self.assertEqual(Player.objects.filter(session=session).count(), 3)
def test_smoke_staging_writes_artifact_when_requested(self): def test_smoke_staging_writes_phase_evidence_artifact_when_requested(self):
with tempfile.TemporaryDirectory() as tmp_dir: with tempfile.TemporaryDirectory() as tmp_dir:
artifact_path = Path(tmp_dir) / "smoke.json" artifact_path = Path(tmp_dir) / "smoke.json"
call_command("smoke_staging", artifact=str(artifact_path)) call_command("smoke_staging", artifact=str(artifact_path))
@@ -1913,24 +1913,40 @@ class SmokeStagingCommandTests(TestCase):
self.assertTrue(artifact_path.exists()) self.assertTrue(artifact_path.exists())
payload = json.loads(artifact_path.read_text(encoding="utf-8")) payload = json.loads(artifact_path.read_text(encoding="utf-8"))
self.assertTrue(payload["ok"]) self.assertTrue(payload["ok"])
self.assertEqual(payload["command"], "smoke_staging") self.assertEqual(payload["command"], "python manage.py smoke_staging --artifact <path>")
self.assertEqual(payload["players"], ["P1", "P2", "P3"]) self.assertEqual(payload["players"], ["P1", "P2", "P3"])
self.assertIn("generated_at", payload) self.assertIn("generated_at", payload)
self.assertIn("session_code", payload) self.assertIn("session_code", payload)
self.assertEqual(payload["question"]["correct_answer"], "Correct")
self.assertEqual(payload["guess_plan"]["P2"], "Correct")
step_names = [step["step"] for step in payload["steps"]]
self.assertEqual( self.assertEqual(
payload["steps"], step_names,
[ [
"create_session", "create_session",
"join_players", "join_players",
"start_round", "start_round",
"submit_lies",
"auto_guess_transition", "auto_guess_transition",
"submit_guesses", "submit_guesses",
"auto_reveal_to_scoreboard", "auto_reveal_transition",
"auto_scoreboard_transition",
"finish_game", "finish_game",
], ],
) )
reveal_step = payload["steps"][5]
self.assertEqual(reveal_step["session_status"], GameSession.Status.REVEAL)
self.assertEqual(reveal_step["reveal"]["correct_answer"], "Correct")
self.assertEqual(reveal_step["reveal"]["lies_count"], 3)
self.assertEqual(reveal_step["reveal"]["guesses_count"], 3)
self.assertEqual(len(reveal_step["reveal"]["fooled_player_ids"]), 2)
self.assertEqual(len(reveal_step["reveal"]["correct_guess_player_ids"]), 1)
scoreboard_step = payload["steps"][6]
self.assertEqual(scoreboard_step["session_status"], GameSession.Status.SCOREBOARD)
self.assertEqual(len(scoreboard_step["leaderboard"]), 3)
class I18nResolverTests(TestCase): class I18nResolverTests(TestCase):
def test_resolve_locale_accepts_language_tags_and_normalizes_to_supported_base_locale(self): def test_resolve_locale_accepts_language_tags_and_normalizes_to_supported_base_locale(self):