:root{
  --bg:#0f1116; --bg2:#161921; --bg3:#1f232d; --fg:#e7e9ee; --muted:#8a8f9b;
  --border:#2a2f3a; --accent:#8ab4ff; --accent2:#ffb347;
  --pass:#39d17b; --fail:#ef5a5a; --neutral:#555a68;
  --pass-bg:#0f5234; --fail-bg:#5a1818;
}
*{box-sizing:border-box}
html,body{margin:0;padding:0;font:14px/1.5 -apple-system,BlinkMacSystemFont,"SF Pro Text","Segoe UI",Inter,system-ui,sans-serif;background:var(--bg);color:var(--fg);}
a{color:var(--accent);text-decoration:none}
a:hover{text-decoration:underline}
code,pre{font-family:"SF Mono","JetBrains Mono",Menlo,Consolas,monospace;font-size:12.5px}
pre{background:var(--bg2);padding:10px 12px;border:1px solid var(--border);border-radius:6px;overflow:auto;white-space:pre-wrap;word-break:break-word}
code{background:var(--bg3);padding:1px 6px;border-radius:4px}

header{background:var(--bg2);border-bottom:1px solid var(--border);position:sticky;top:0;z-index:10}
header .container{display:flex;align-items:center;gap:20px;flex-wrap:wrap;padding:10px 20px}
header h1{font-size:17px;margin:0;font-weight:600}
nav{display:flex;gap:2px}
nav a{padding:6px 14px;border-radius:6px;color:var(--muted);font-weight:500}
nav a.active{background:var(--bg3);color:var(--fg)}
.meta{margin-left:auto;color:var(--muted);font-size:12px}

main.container{padding:20px}
.container{max-width:1600px;margin:0 auto}
footer{padding:20px;color:var(--muted);font-size:12px}

.view{display:none}
.view.active{display:block}

.toolbar{display:flex;gap:12px;align-items:center;padding:8px 0 16px;flex-wrap:wrap}
.toolbar label{display:inline-flex;gap:6px;align-items:center;color:var(--muted);font-size:13px}
.toolbar input[type=search],.toolbar select{background:var(--bg2);color:var(--fg);border:1px solid var(--border);border-radius:5px;padding:5px 8px;font-size:13px;min-width:180px}

.card-grid{display:grid;grid-template-columns:repeat(auto-fill,minmax(280px,1fr));gap:10px}
.card{background:var(--bg2);border:1px solid var(--border);border-radius:8px;padding:12px 14px;cursor:pointer;transition:border-color .1s}
.card:hover{border-color:var(--accent)}
.card h3{margin:0 0 4px;font-size:14px}
.card .sub{color:var(--muted);font-size:12px;margin-bottom:8px}
.card .kv{display:grid;grid-template-columns:max-content auto;gap:1px 10px;font-size:12px}
.card .kv dt{color:var(--muted)}
.card .kv dd{margin:0}
.card .score{font-weight:700;font-variant-numeric:tabular-nums}

.badge{display:inline-block;padding:2px 7px;border-radius:10px;font-size:11px;font-weight:600;background:var(--bg3);color:var(--muted);margin-right:4px}
.badge.reasoning-off{background:#1d3c28;color:#92e6b2}
.badge.reasoning-on{background:#4a2e12;color:#f5c27e}
.badge.reasoning-on-default{background:#34294a;color:#cba0ff}
.badge.reasoning-on-always{background:#5a1f3a;color:#f096c9}

/* Heatmap */
.heatmap-wrap{overflow-x:auto;border:1px solid var(--border);border-radius:8px;background:var(--bg2)}
table.heatmap{border-collapse:collapse;font-size:12px;width:100%;min-width:1000px}
table.heatmap th,table.heatmap td{padding:4px 6px;text-align:center;white-space:nowrap;border-right:1px solid var(--border);border-bottom:1px solid var(--border)}
table.heatmap thead th{background:var(--bg3);font-weight:600;color:var(--muted);position:sticky;top:0;z-index:1}
table.heatmap tbody th{background:var(--bg2);text-align:left;position:sticky;left:0;z-index:1;font-weight:500;max-width:280px;overflow:hidden;text-overflow:ellipsis}
table.heatmap td.cell{font-variant-numeric:tabular-nums;font-weight:600;cursor:pointer}
table.heatmap td.cell:hover{outline:2px solid var(--accent);outline-offset:-2px}
table.heatmap td.empty{color:var(--muted);background:var(--bg2)}

/* Panels */
.panel{background:var(--bg2);border:1px solid var(--border);border-radius:8px;padding:18px 22px;margin-top:20px}
.panel h2{margin:0 0 14px;font-size:18px}
.panel h3{margin:20px 0 8px;font-size:15px;color:var(--muted)}
.panel .close{float:right;color:var(--muted);cursor:pointer;font-size:18px;line-height:1;background:none;border:0}
.hidden{display:none}

/* Tables */
table.data{border-collapse:collapse;width:100%;font-size:13px}
table.data th,table.data td{padding:6px 10px;text-align:left;border-bottom:1px solid var(--border)}
table.data th{background:var(--bg3);font-weight:600;color:var(--muted);text-transform:uppercase;font-size:11px;letter-spacing:.03em}
table.data tr:hover{background:var(--bg3)}
td.num{text-align:right;font-variant-numeric:tabular-nums}
td.score-pass{color:var(--pass);font-weight:700}
td.score-fail{color:var(--fail)}
td.score-partial{color:var(--accent2)}

.pass-dot{color:var(--pass)}
.fail-dot{color:var(--fail)}

.task-row{background:var(--bg2);border:1px solid var(--border);border-radius:6px;padding:10px 14px;margin-bottom:6px;cursor:pointer}
.task-row:hover{border-color:var(--accent)}
.task-row .name{font-weight:600}
.task-row .suite-chip{font-size:11px;color:var(--muted);margin-left:8px}
.task-row .prompt-snippet{color:var(--muted);font-size:12px;margin-top:4px;max-height:3em;overflow:hidden;text-overflow:ellipsis}

.chip{display:inline-block;padding:1px 8px;background:var(--bg3);border-radius:10px;font-size:11px;color:var(--muted);margin-right:4px}

.compare-grid{display:grid;grid-template-columns:1fr 1fr;gap:20px;margin-top:12px}

/* Global search */
.global-search{position:relative;margin-left:auto;margin-right:16px;min-width:280px;flex:0 0 320px}
.global-search input{width:100%;background:var(--bg3);color:var(--fg);border:1px solid var(--border);border-radius:18px;padding:6px 14px;font-size:13px}
.global-search input:focus{outline:none;border-color:var(--accent)}
.typeahead{position:absolute;top:calc(100% + 4px);right:0;left:0;background:var(--bg2);border:1px solid var(--border);border-radius:8px;max-height:60vh;overflow-y:auto;display:none;z-index:20;box-shadow:0 4px 20px rgba(0,0,0,.5)}
.typeahead.open{display:block}
.typeahead-group{padding:6px 10px 4px;font-size:10px;text-transform:uppercase;color:var(--muted);letter-spacing:.08em;background:var(--bg3);border-bottom:1px solid var(--border);position:sticky;top:0}
.typeahead-item{padding:6px 12px;cursor:pointer;font-size:13px;border-bottom:1px solid var(--border)}
.typeahead-item:hover,.typeahead-item.selected{background:var(--bg3);color:var(--accent)}
.typeahead-item .hint{color:var(--muted);font-size:11px;margin-left:8px}
.typeahead-item mark{background:rgba(138,180,255,.3);color:var(--fg);padding:0 2px;border-radius:2px}

.hint{margin-top:10px;padding:10px 14px;background:var(--bg2);border-left:3px solid var(--accent);border-radius:4px;font-size:12.5px;color:var(--muted)}
.hint strong{color:var(--fg)}

/* Overview heatmap cell when showing both score + tps — two lines per cell */
table.heatmap td.cell .score-primary{display:block;font-size:13px;font-weight:700;line-height:1.15}
table.heatmap td.cell .tps{display:block;font-size:10px;font-weight:500;opacity:.75;letter-spacing:.02em;line-height:1.1;margin-top:1px}
table.heatmap td.cell{padding:5px 6px;vertical-align:middle;position:relative}

/* Winner: BEST combination of score AND speed in its column. Distinctive gold. */
table.heatmap td.cell.winner{
  box-shadow: inset 0 0 0 2px #f5c842, 0 0 10px rgba(245,200,66,.35);
  background: linear-gradient(135deg, hsl(50, 60%, 28%) 0%, hsl(140, 55%, 24%) 60%) !important;
  color: #fff9d9 !important;
}
table.heatmap td.cell.winner .score-primary{font-weight:800;text-shadow:0 1px 2px rgba(0,0,0,.5)}
table.heatmap td.cell.winner .tps{opacity:1;color:#ffe28a;font-weight:600}
table.heatmap td.cell .win-badge{
  position:absolute;top:2px;right:4px;font-size:11px;color:#f5c842;
  text-shadow:0 0 4px rgba(245,200,66,.6);font-weight:700;pointer-events:none;
}
/* Runner-up: top 2-3 in column — subtle cyan ring so they're visible but secondary */
table.heatmap td.cell.runner-up{
  box-shadow: inset 0 0 0 1px rgba(138,180,255,.55);
}
table.heatmap td.cell.runner-up .score-primary{font-weight:700}

/* Roles tab */
.role-card{background:var(--bg2);border:1px solid var(--border);border-radius:8px;padding:14px 18px;margin-bottom:14px}
.role-card h3{margin:0 0 8px;font-size:16px;display:flex;align-items:center;gap:10px}
.role-card h3 .suite-list{font-size:11px;font-weight:400;color:var(--muted)}
.role-rank-table{font-size:13px;width:100%}
.role-rank-table td{padding:4px 10px;border-bottom:1px solid var(--border)}
.role-rank-table td.rank{color:var(--muted);width:28px;text-align:right}
.role-rank-table td.model{width:auto}
.role-rank-table td.score{font-weight:600;width:80px;text-align:right;font-variant-numeric:tabular-nums}
.role-rank-table td.tps{width:80px;text-align:right;color:var(--muted);font-variant-numeric:tabular-nums}
.role-rank-table td.composite{width:80px;text-align:right;font-weight:600;font-variant-numeric:tabular-nums}
.role-card .best{background:linear-gradient(90deg,hsla(140,50%,25%,.35),transparent)}

/* Family comparison */
.family-header{margin-bottom:10px;color:var(--muted)}
.family-header strong{color:var(--fg)}

/* Host chip in header */
.hostchip{display:inline-block;padding:1px 8px;margin-left:8px;background:var(--bg3);border-radius:10px;font-size:11px;color:var(--muted);cursor:help}

/* Testing tab */
#testingDot{display:inline-block;width:8px;height:8px;border-radius:50%;margin-left:4px}
#testingDot.live-dot{background:#39d17b;box-shadow:0 0 8px rgba(57,209,123,.8);animation:pulse 1.2s infinite}
@keyframes pulse{0%,100%{opacity:1;transform:scale(1)}50%{opacity:.5;transform:scale(.85)}}
.live-dot{display:inline-block;width:10px;height:10px;border-radius:50%;background:#39d17b;box-shadow:0 0 10px rgba(57,209,123,.8);animation:pulse 1.2s infinite;margin-right:6px;vertical-align:middle}

.progress-bar{height:6px;background:var(--bg3);border-radius:3px;overflow:hidden}
.progress-bar-fill{height:100%;background:linear-gradient(90deg,var(--accent),#39d17b);transition:width .3s}

.testing-table tr.row-running{background:rgba(138,180,255,.08)}
.testing-table tr.row-running td{border-bottom:1px solid rgba(138,180,255,.2)}
.testing-table tr.row-done{opacity:.85}
.testing-table tr.row-pending{opacity:.55}

.status-badge{display:inline-block;padding:2px 8px;border-radius:10px;font-size:11px;font-weight:600}
.status-running{background:#1a3a5c;color:#8ab4ff}
.status-done{background:#1d3c28;color:#92e6b2}
.status-pending{background:var(--bg3);color:var(--muted)}
.status-failed{background:var(--fail-bg);color:#ef5a5a}

.param-chip{display:inline-block;padding:0 5px;margin:1px 2px 1px 0;background:var(--bg3);border:1px solid var(--border);border-radius:3px;font-size:9.5px;font-family:"SF Mono",Menlo,monospace;color:#d5ddea;white-space:nowrap;line-height:1.55;max-width:200px;overflow:hidden;text-overflow:ellipsis}
.param-chip.param-load{background:#1a2438;border-color:#2a3a5a;color:#a8c4f0}  /* load-side params use a cool-blue tint */

/* Params cell in Testing tab — fixed width, wraps inside */
.testing-table td:last-child{max-width:280px;white-space:normal;line-height:1.4}

/* Reasoning state chip — explicit visual so you can see at-a-glance whether reasoning was active during a run */
.reasoning-chip{display:inline-block;padding:2px 8px;border-radius:10px;font-size:11px;font-weight:600;white-space:nowrap;font-family:"SF Mono",Menlo,monospace}
.reasoning-chip.r-off    {background:#0f3a24;color:#92e6b2;border:1px solid #1d5c3a}  /* green: disabled */
.reasoning-chip.r-on     {background:#4a2e12;color:#f5c27e;border:1px solid #6a4420}  /* orange: enabled */
.reasoning-chip.r-always {background:#4a1e3a;color:#f096c9;border:1px solid #6a2a54}  /* magenta: always */
.reasoning-chip.r-low    {background:#3a2e1a;color:#e8c77e;border:1px solid #5a4428}  /* pale orange: low effort */
.reasoning-chip.r-med    {background:#4a2e12;color:#f5b060;border:1px solid #6a4420}
.reasoning-chip.r-high   {background:#5a1e12;color:#ef7a5a;border:1px solid #7a2e20}
.reasoning-chip.r-na     {background:var(--bg3);color:var(--muted);border:1px solid var(--border)}
