from textwrap import dedent
from dotenv import load_dotenv
load_dotenv()

from arcllm import load_model, Message
from rich import print
from rich.panel import Panel
from rich.console import Console

# Shared rich console; the cells below print each model reply through it as a Panel.
console = Console()
# Model handle returned by arcllm's load_model for the name 'anthropic';
# `ask` awaits its `invoke` method.
model = load_model('anthropic')

async def ask(prompt: str, *, system: str | None = None) -> str:
    """Send a single user prompt to the module-level model and return its text.

    Args:
        prompt: Text sent as the user message.
        system: Optional text sent as a system message ahead of the user
            message. Skipped when it is None or an empty string.

    Returns:
        The ``content`` attribute of the response, or an empty string when
        that attribute is falsy.
    """
    # The system message, when present, always precedes the user message.
    preamble = [Message(role='system', content=system)] if system else []
    conversation = [*preamble, Message(role='user', content=prompt)]
    reply = await model.invoke(conversation)
    return reply.content or ''

# Abstract that every prompt variant below asks the model to summarize.
PAPER = dedent('''
    We present a method for accelerating tokamak plasma simulations using
    a graph-neural-network surrogate trained on 12,000 hours of HPC runs.
    The surrogate predicts edge-plasma density 200x faster than the
    reference fluid solver, with mean absolute error under 4% across
    held-out shots. We do not address pellet injection or RMP coil
    configurations. Code available; data released under DOE-cleared
    embargo until 2027.
''').strip()

# Four prompts for the same summarization task, keyed by a display label.
#
# The multi-line templates are dedented BEFORE the paper is substituted in.
# PAPER's own lines start at column 0, so interpolating it first (with an
# f-string) leaves dedent() with no common margin to strip, and every
# template line -- including the Markdown table rows -- would keep its
# source indentation in the prompt sent to the model.
PROMPTS = {
    'BAD (vague)':
        'Summarize this:\n\n' + PAPER,
    'MEDIUM (specifies length)':
        f'Summarize this in 2 sentences:\n\n{PAPER}',
    'GOOD (structured ask)': dedent('''
        Summarize this paper as 3 bullets:
        - Contribution (what is new)
        - Method (how)
        - Limitations (what it does NOT do)

        Paper:
        {paper}
    ''').strip().format(paper=PAPER),
    'GREAT (role + format + bound)': dedent('''
        You are a national-lab program manager skimming proposals.
        Read the paper and output exactly this Markdown table:

        | Field | Value |
        |---|---|
        | Contribution | _≤12 words_ |
        | Method | _≤12 words_ |
        | Speedup | _quote the number_ |
        | Accuracy | _quote the number_ |
        | Out of scope | _≤12 words_ |
        | Availability | _quote the wording_ |

        Paper:
        {paper}
    ''').strip().format(paper=PAPER),
}

for label, prompt in PROMPTS.items():
    out = await ask(prompt)
    console.print(Panel(out, title=f'[bold]{label}[/bold]', border_style='cyan'))

import json

INCIDENT = dedent('''
    Around 09:02 on April 12, run 42 hit a DRAM ECC error on node-7.
    The job auto-rerouted to node-8 and finished by 09:05.
    Operator on shift was Singh. No data loss reported.
''').strip()

PLAN_SYSTEM = (
    'You are a planning step. Do NOT extract data. '
    'Output ONLY a JSON array of {"field": ..., "type": ..., "required": ...} objects '
    'describing what should be extracted from the incident report.'
)

plan_text = await ask(
    f'Plan extraction fields for this incident report:\n\n{INCIDENT}',
    system=PLAN_SYSTEM,
)
console.print(Panel(plan_text, title='PLAN', border_style='yellow'))

# parse the JSON (strip code fences if the model used them)
import re
json_text = re.search(r'\[.*\]', plan_text, re.DOTALL).group(0)
plan = json.loads(json_text)
print(f'\nplan parsed: {len(plan)} fields')

DO_SYSTEM = (
    'You are an extraction step. Extract values for EXACTLY the fields listed in the plan. '
    'Output ONLY a JSON object keyed by field name. Use null when a value is missing.'
)

do_text = await ask(
    dedent(f'''
        Plan:
        {json.dumps(plan, indent=2)}

        Incident report:
        {INCIDENT}
    ''').strip(),
    system=DO_SYSTEM,
)
console.print(Panel(do_text, title='DO', border_style='green'))

extracted = json.loads(re.search(r'\{.*\}', do_text, re.DOTALL).group(0))
print(f'\nextracted {len(extracted)} fields')

CHECK_SYSTEM = (
    'You are a validation step. Compare extracted output against the plan. '
    'Output ONLY JSON: {"ok": bool, "missing": [field...], "extra": [field...], "type_mismatches": [...]}'
)

check_text = await ask(
    dedent(f'''
        Plan:
        {json.dumps(plan, indent=2)}

        Extracted:
        {json.dumps(extracted, indent=2)}
    ''').strip(),
    system=CHECK_SYSTEM,
)
console.print(Panel(check_text, title='CHECK', border_style='red'))

verdict = json.loads(re.search(r'\{.*\}', check_text, re.DOTALL).group(0))
print(f'\nok={verdict.get("ok")}')

| Anti-pattern | Example | Fix |
|---|---|---|
| Vague | "make it better" | Specify what better means: shorter? more cited? more concrete? |
| Kitchen-sink | 30 instructions in one prompt | Split into stages. The model can't track 30 things at once. |
| Contradictory | "be exhaustive but terse" | Pick one. Or rank: "as terse as you can while still naming each gene." |
| Hidden context | "as we discussed earlier" | Restate the context. The model didn't read your last meeting. |
| Buried lede | actual task in line 47 of background | Put the task in the first line. Move background to the end. |

Notebook 02 — Prompts That Work

Setup

1. Good vs bad — same task, four prompts

2. The five anti-patterns

3. Plan · Do · Check — three prompts, one task

Stage 1 — PLAN

Stage 2 — DO

Stage 3 — CHECK

4. Why this matters

Takeaway