"""Frozen canonical prompts for the Weeyuga benchmark harness. These three prompts NEVER change once shipped. New prompts get new IDs (P-NEW1, P-NEW2, ...). See docs/BENCHMARKS/HARNESS.md ยง3. """ PROMPTS = { "P-EASY": { "intent": "trivial โ€” single-token response space, near-zero work", "prompt": "hi", "max_tokens": 64, }, "P-MEDIUM": { "intent": "bounded structured task โ€” 4 sentences on a known topic", "prompt": "Explain in 4 sentences why the sky appears blue at noon.", "max_tokens": 512, }, "P-HARD": { "intent": "open-ended creative โ€” 200-word generation", "prompt": ( "Write a 200-word story about a fisherman who discovers a " "coin from a sunken empire." ), "max_tokens": 1024, }, }