from dotenv import load_dotenv
load_dotenv()

from arcllm import load_model, Message
from arcllm._pii import RegexPiiDetector, redact_text
from arcrun import run, SandboxConfig, make_execute_tool
from rich import print
from rich.console import Console
from rich.markup import escape
from rich.panel import Panel
from rich.table import Table

# Shared Rich console used for every table and panel rendered below.
console = Console()

# Sample message seeded with an email address, an SSN, a card number and a
# phone number so the detector has something to report.
RAW = (
    'Hi, please email jane.doe@nationallab.gov about subject 47. '
    'Her SSN is 123-45-6789 and the corp card on file is 4242 4242 4242 4242. '
    'My cell is 555-867-5309.'
)

detector = RegexPiiDetector()
matches = detector.detect(RAW)

# One row per finding: its PII type, its start-end span, and the matched text.
tbl = Table(title='PII findings')
tbl.add_column('type', style='red')
for heading in ('span', 'matched text'):
    tbl.add_column(heading)
for hit in matches:
    span = f'{hit.start}-{hit.end}'
    tbl.add_row(hit.pii_type, span, repr(hit.matched_text))
console.print(tbl)

# Show the same message with every finding redacted.
redacted = redact_text(RAW, matches)
console.print(Panel(redacted, title='redacted', border_style='green'))

model_redacted = load_model('anthropic', security={'pii_enabled': True})

resp = await model_redacted.invoke([
    Message(role='user', content=f'Summarize what you can see about this customer: {RAW}')
])
console.print(Panel(resp.content or '', title='LLM response (saw redacted text)', border_style='cyan'))

model = load_model('anthropic')
exec_tool = make_execute_tool(timeout_seconds=10, max_output_bytes=4096)

events_open: list = []
result_open = await run(
    model=model, tools=[exec_tool],
    sandbox=SandboxConfig(allowed_tools=['execute_python']),
    system_prompt='Use execute_python when math is needed.',
    task='Compute the first 10 Fibonacci numbers and print them.',
    on_event=events_open.append,
)
console.print(Panel(result_open.content or '', title='OPEN sandbox — tool allowed', border_style='green'))
n_denied = sum(1 for e in events_open if e.type == 'tool.denied')
print(f'  turns={result_open.turns}  tool_calls={result_open.tool_calls_made}  tool.denied events: {n_denied}')

events_closed: list = []
result_closed = await run(
    model=model, tools=[exec_tool],
    sandbox=SandboxConfig(allowed_tools=[]),  # empty allowlist => nothing fires
    system_prompt='Use execute_python when math is needed.',
    task='Compute the first 5 Fibonacci numbers.',
    on_event=events_closed.append,
    max_turns=3,
)
denied = [dict(e.data) for e in events_closed if e.type == 'tool.denied']
console.print(Panel(str(denied), title='CLOSED sandbox — tool.denied events', border_style='red'))
print(f'  turns={result_closed.turns}  tool_calls={result_closed.tool_calls_made}')

events_exec: list = []
exec_result = await run(
    model=model, tools=[make_execute_tool(timeout_seconds=15, max_output_bytes=8192)],
    sandbox=SandboxConfig(allowed_tools=['execute_python']),
    system_prompt='Use execute_python to compute things rather than reasoning step-by-step.',
    task='Find all prime numbers under 100 using a sieve. Print them comma-separated.',
    on_event=events_exec.append,
)

for e in events_exec:
    if e.type == 'tool.start' and e.data.get('name') == 'execute_python':
        code_run = e.data.get('arguments', {}).get('code', '')
        console.print(Panel(code_run, title='code the agent wrote', border_style='yellow'))

console.print(Panel(exec_result.content or '', title='final answer', border_style='cyan'))

from arcrun.builtins.contained_execute import make_contained_execute_tool

# Settings handed to the container-backed execute tool, gathered in one place.
container_limits = {
    'image': 'python:3.12-slim',
    'timeout_seconds': 30,
    'max_output_bytes': 65536,
    'mem_limit': '256m',        # cgroup memory ceiling
    'cpu_period': 100_000,      # CFS period (microseconds)
    'cpu_quota': 50_000,        # 50% of one core
    'pids_limit': 64,           # process count cap
    'tmpfs_size': '64m',        # writable tmpfs only — no host FS
    'network_disabled': True,   # no egress, no exfiltration
}
tool = make_contained_execute_tool(**container_limits)

import logging
logging.basicConfig(level=logging.INFO, format='%(name)s %(message)s', force=True)

model_audited = load_model(
    'anthropic',
    security={'pii_enabled': True},
    audit={'log_level': 'INFO'},
)
_ = await model_audited.invoke([Message(role='user', content='What is 2 + 2?')])
print('(audit metadata logged above by arcllm.modules.audit — no message content)')

# Budget section: build the task_complete tool. make_budget_breach_args is
# imported here but never called in the visible code.
from arcrun.builtins import make_task_complete_tool, make_budget_breach_args
complete_tool = make_task_complete_tool()
# loop sees usage cross threshold → emits budget breach via task_complete
# NOTE(review): complete_tool is not passed to any run() call in the visible
# code — presumably illustrative only; confirm.

model = load_model(
    'anthropic',
    security={'pii_enabled': True, 'signing_enabled': True},  # PII redact + Ed25519 sign
    audit={'log_level': 'INFO'},                              # PII-safe metadata logs
    telemetry={'budget_scope': 'agent:plasma-007'},           # cost ceilings
    rate_limit=True,                                          # provider TPS caps
    retry=True,                                               # exponential backoff
    fallback=True,                                            # provider failover
    otel=True,                                                # OpenTelemetry export
)

result = await run(
    model=model,
    tools=[make_execute_tool(timeout_seconds=10, max_output_bytes=8192)],
    sandbox=SandboxConfig(allowed_tools=['execute_python']),
    system_prompt=YOUR_SYSTEM,
    task=YOUR_TASK,
)

assert result.verify_integrity().valid  # tamper-evident chain

| Defense | Mechanism | OWASP map |
| --- | --- | --- |
| PII redaction | `security={'pii_enabled': True}` on `load_model()` | LLM02 (Sensitive Disclosure) |
| Tool allowlist | `SandboxConfig(allowed_tools=[...])` | LLM06 (Excessive Agency) |
| Sandboxed code exec | `make_execute_tool` (subprocess) / `make_contained_execute_tool` (Docker) | LLM05 + ASI05 (RCE) |
| PII-safe audit | `audit={...}` (metadata-only by default) | LLM07 (log hygiene) |
| Cost / token budgets | `telemetry={'budget_scope': ...}` + `task_complete` terminator | LLM10 (Unbounded Consumption) |
| Tamper-evident chain | `verify_chain()` (notebook 06) | NIST AU-9, AU-10 |

Notebook 07 — Security at Runtime

Setup

1. PII detection — what's in the message?

2. Plug it into the LLM call — `SecurityModule`

3. Sandbox — only allowed tools fire

4. Sandboxed code execution — `make_execute_tool`

5. Container isolation for higher tiers — `make_contained_execute_tool`

6. PII-safe audit by default — `AuditModule`

7. Budgets — `task_complete` and `make_budget_breach_args`

8. The full security stack on one call

Takeaway

Notebook 07 — Security at Runtime

Setup

1. PII detection — what's in the message?

2. Plug it into the LLM call — SecurityModule

3. Sandbox — only allowed tools fire

4. Sandboxed code execution — make_execute_tool

5. Container isolation for higher tiers — make_contained_execute_tool

6. PII-safe audit by default — AuditModule

7. Budgets — task_complete and make_budget_breach_args

8. The full security stack on one call

Takeaway

2. Plug it into the LLM call — `SecurityModule`

4. Sandboxed code execution — `make_execute_tool`

5. Container isolation for higher tiers — `make_contained_execute_tool`

6. PII-safe audit by default — `AuditModule`

7. Budgets — `task_complete` and `make_budget_breach_args`