e.stopPropagation()} style={{ width: '100%', maxWidth: 880, maxHeight: 'calc(100vh - 80px)', overflowY: 'auto', background: 'var(--bg)', border: '1px solid var(--line-2)', borderRadius: 6, padding: 20, fontFamily: 'var(--font-body)', }}>

Agent capability tests

brain + API + recall + citation discipline · {manifest.length} tests

{err && (

{err}

)} {/* Run controls */}

{report && ( = 0.7 ? '#d9a85f' : '#d96a6a', }}> {report.passed}/{report.n} pass · {(report.pass_rate * 100).toFixed(0)}% · {report.duration_s}s · ~{report.approx_tokens_input + report.approx_tokens_output} tokens )}

{/* Manifest with results merged in */} {manifest.map(t => { const r = report?.results?.find(x => x.id === t.id); const isSel = selected.has(t.id); const status = r ? (r.passed ? 'pass' : 'fail') : 'idle'; const accent = status === 'pass' ? '#5fb37c' : status === 'fail' ? '#d96a6a' : 'var(--line)'; return (

toggle(t.id)} style={{ marginRight: 4, cursor: 'pointer' }} /> {t.id} {t.tag} {r && ( <> {r.tool_pass ? '✓' : '✗'} tool {r.content_pass ? '✓' : '✗'} content {t.must_cite_path && ( {r.citation_pass ? '✓' : '✗'} cite )} {r.duration_s}s · {r.tools_called.join(',') || '—'} )}

{t.question}

{t.must_call_tool && (

must call: {t.must_call_tool} {t.must_contain.length > 0 && ` · must contain: ${t.must_contain.join(', ')}`} {t.must_cite_path && ' · must cite path'}

)} {r && r.notes.length > 0 && (

{r.notes.map((n, i) =>

⚠ {n}

)}

)} {r && r.response_preview && (

{r.response_preview}

)}

); })}