/*
 * Application stylesheet, expanded from its minified form.
 * Rule order is significant: later rules of equal specificity win, and each
 * media query comes after the base rules it overrides.
 */

/* ---------- Document defaults ---------- */

:root {
  font-family: system-ui, -apple-system, Segoe UI, Roboto, Helvetica, Arial, sans-serif;
  line-height: 1.5;
  font-weight: 400;
  color-scheme: light;
  color: #213547;
  background-color: #f5f5f5;
  font-synthesis: none;
  text-rendering: optimizeLegibility;
  -webkit-font-smoothing: antialiased;
  -moz-osx-font-smoothing: grayscale;
}

* {
  box-sizing: border-box;
}

body {
  margin: 0;
  min-width: 320px;
  min-height: 100vh;
}

#root {
  width: 100%;
  min-height: 100vh;
}

/* Second reset: repeats box-sizing and also zeroes margin/padding on every element. */
* {
  box-sizing: border-box;
  margin: 0;
  padding: 0;
}

/* Sets font-family, color and line-height on body itself, replacing what it would inherit from :root. */
body {
  font-family: -apple-system, BlinkMacSystemFont, Segoe UI, Roboto, Oxygen, Ubuntu, sans-serif;
  background: #fafafa;
  color: #333;
  line-height: 1.6;
}

/* ---------- App shell and status messages ---------- */

.app {
  max-width: 960px;
  margin: 0 auto;
  padding: 40px 20px;
}

.loading,
.error {
  text-align: center;
  padding: 60px 20px;
  color: #666;
}

/* ---------- Landing: header, task cards, footer ---------- */

.landing-header {
  text-align: center;
  margin-bottom: 48px;
}

.landing-header h1 {
  font-size: 2.5rem;
  font-weight: 600;
  margin: 0 0 12px;
  letter-spacing: -0.5px;
}

.tagline {
  font-size: 1.1rem;
  color: #666;
  margin: 0;
}

.task-grid {
  display: grid;
  gap: 24px;
  margin-bottom: 48px;
}

.task-card {
  display: block;
  background: #fff;
  border: 1px solid #e0e0e0;
  border-radius: 8px;
  padding: 28px;
  text-decoration: none;
  color: inherit;
  transition: box-shadow 0.2s, border-color 0.2s;
}

.task-card:hover {
  box-shadow: 0 4px 12px #00000014;
  border-color: #ccc;
}

.task-card h2 {
  font-size: 1.4rem;
  font-weight: 600;
  margin: 0 0 12px;
}

.task-card .description {
  color: #555;
  margin: 0 0 16px;
}

.task-stats {
  display: flex;
  gap: 24px;
  margin-bottom: 16px;
}

.task-stats .stat {
  font-size: 0.9rem;
  color: #888;
}

.view-link {
  color: #2563eb;
  font-weight: 500;
}

.landing-footer {
  text-align: center;
  padding-top: 24px;
  border-top: 1px solid #e0e0e0;
  color: #666;
}

.landing-footer p {
  margin: 0;
}

/* ---------- Task detail: header, breadcrumb, context, example ---------- */

.task-detail {
  background: #fff;
  border: 1px solid #e0e0e0;
  border-radius: 8px;
  padding: 32px;
}

.task-header {
  margin-bottom: 32px;
  padding-bottom: 24px;
  border-bottom: 1px solid #eee;
}

.breadcrumb {
  margin-bottom: 16px;
  font-size: 0.9rem;
}

.back-link {
  color: #2563eb;
  text-decoration: none;
}

.back-link:hover {
  text-decoration: underline;
}

.breadcrumb .separator {
  margin: 0 8px;
  color: #ccc;
}

.breadcrumb .current {
  color: #666;
}

.task-header h1 {
  font-size: 2rem;
  font-weight: 600;
  margin: 0 0 8px;
}

.task-description {
  font-size: 1.1rem;
  color: #555;
  margin: 0;
}

.task-context {
  background: #f8f9fa;
  border-radius: 6px;
  padding: 24px;
  margin-bottom: 24px;
}

.task-context h2 {
  font-size: 1rem;
  font-weight: 600;
  text-transform: uppercase;
  letter-spacing: 0.5px;
  color: #666;
  margin: 0 0 16px;
}

.task-context .instruction {
  margin: 0 0 16px;
  line-height: 1.7;
}

.tools-list,
.expected-sequence {
  font-size: 0.95rem;
  margin-bottom: 8px;
}

.expected-sequence code {
  background: #e8e8e8;
  padding: 2px 8px;
  border-radius: 4px;
  font-family: SF Mono, Monaco, monospace;
}

.example-section {
  margin-bottom: 32px;
}

.example-section h2 {
  font-size: 1rem;
  font-weight: 600;
  text-transform: uppercase;
  letter-spacing: 0.5px;
  color: #666;
  margin: 0 0 16px;
}

.example-box {
  border-left: 3px solid #2563eb;
  padding-left: 20px;
}

.user-query {
  margin-bottom: 16px;
}

.user-query .label,
.expected-calls .label {
  display: block;
  font-size: 0.85rem;
  font-weight: 600;
  color: #888;
  margin-bottom: 4px;
}

.user-query p {
  margin: 0;
  font-style: italic;
  color: #333;
}

/* Restores list indentation removed by the universal padding reset. */
.expected-calls ol {
  margin: 8px 0 0;
  padding-left: 20px;
}

.expected-calls li {
  margin-bottom: 8px;
}

.expected-calls code {
  background: #e8f4fd;
  color: #1e40af;
  padding: 2px 6px;
  border-radius: 3px;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.9rem;
}

.expected-calls .args {
  color: #666;
  font-size: 0.9rem;
}

/* ---------- Results table ---------- */

.results-section h2 {
  font-size: 1rem;
  font-weight: 600;
  text-transform: uppercase;
  letter-spacing: 0.5px;
  color: #666;
  margin: 0 0 16px;
}

.results-meta {
  display: flex;
  gap: 24px;
  margin-bottom: 16px;
  font-size: 0.9rem;
  color: #888;
}

.results-table {
  width: 100%;
  border-collapse: collapse;
  font-size: 0.95rem;
}

.results-table th {
  text-align: left;
  padding: 12px 16px;
  background: #f8f9fa;
  border-bottom: 2px solid #e0e0e0;
  font-weight: 600;
  color: #555;
  font-size: 0.85rem;
  text-transform: uppercase;
  letter-spacing: 0.3px;
}

.results-table td {
  padding: 14px 16px;
  border-bottom: 1px solid #eee;
}

.results-table tr:hover {
  background: #fafafa;
}

.model-name {
  font-weight: 500;
}

.medal {
  margin-right: 6px;
}

.metric {
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.9rem;
}

.runs {
  color: #888;
}

.status {
  display: inline-block;
  padding: 3px 10px;
  border-radius: 12px;
  font-size: 0.75rem;
  font-weight: 600;
  text-transform: uppercase;
}

.status.fresh {
  background: #dcfce7;
  color: #166534;
}

.status.stale {
  background: #fef3c7;
  color: #92400e;
}

/* Narrow viewports: tightens padding and font sizes of rules declared above. */
@media (max-width: 640px) {
  .app {
    padding: 20px 16px;
  }

  .landing-header h1 {
    font-size: 2rem;
  }

  .task-card {
    padding: 20px;
  }

  .task-stats {
    flex-direction: column;
    gap: 8px;
  }

  .task-detail {
    padding: 20px;
  }

  .results-table {
    font-size: 0.85rem;
  }

  .results-table th,
  .results-table td {
    padding: 10px 8px;
  }
}

/* ---------- Row links ---------- */

.clickable-row {
  cursor: pointer;
}

.row-link {
  color: inherit;
  text-decoration: none;
}

.row-link:hover {
  color: #2563eb;
}

/* ---------- Run detail: header, summary cards, examples table ---------- */

.run-detail {
  background: #fff;
  border: 1px solid #e0e0e0;
  border-radius: 8px;
  padding: 32px;
}

.run-header {
  margin-bottom: 32px;
  padding-bottom: 24px;
  border-bottom: 1px solid #eee;
}

.run-header h1 {
  font-size: 1.8rem;
  font-weight: 600;
  margin: 0 0 8px;
}

.run-meta {
  color: #666;
  margin: 0;
}

.run-summary {
  margin-bottom: 32px;
}

.summary-cards {
  display: grid;
  grid-template-columns: repeat(4, 1fr);
  gap: 16px;
}

.summary-card {
  background: #f8f9fa;
  border-radius: 8px;
  padding: 20px;
  text-align: center;
}

.summary-value {
  display: block;
  font-size: 1.8rem;
  font-weight: 600;
  color: #333;
  font-family: SF Mono, Monaco, monospace;
}

.summary-label {
  display: block;
  font-size: 0.85rem;
  color: #666;
  margin-top: 4px;
}

.examples-section h2 {
  font-size: 1rem;
  font-weight: 600;
  text-transform: uppercase;
  letter-spacing: 0.5px;
  color: #666;
  margin: 0 0 16px;
}

.examples-table {
  width: 100%;
  border-collapse: collapse;
  font-size: 0.95rem;
}

.examples-table th {
  text-align: left;
  padding: 12px 16px;
  background: #f8f9fa;
  border-bottom: 2px solid #e0e0e0;
  font-weight: 600;
  color: #555;
  font-size: 0.85rem;
  text-transform: uppercase;
  letter-spacing: 0.3px;
}

.examples-table td {
  padding: 14px 16px;
  border-bottom: 1px solid #eee;
}

.examples-table tr:hover {
  background: #fafafa;
}

.example-id {
  font-weight: 500;
}

.result {
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.9rem;
  text-align: center;
}

.result.pass {
  color: #166534;
}

.result.fail {
  color: #dc2626;
}

.result.partial {
  color: #d97706;
}

.timing {
  color: #888;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.85rem;
}

/* ---------- Example comparison: score badges, two-column trace ---------- */

.example-compare {
  background: #fff;
  border: 1px solid #e0e0e0;
  border-radius: 8px;
  padding: 32px;
}

.compare-header {
  margin-bottom: 24px;
  padding-bottom: 24px;
  border-bottom: 1px solid #eee;
}

.compare-header h1 {
  font-size: 1.6rem;
  font-weight: 600;
  margin: 0 0 8px;
  font-family: SF Mono, Monaco, monospace;
}

.compare-meta {
  color: #666;
  margin: 0;
}

.scores-summary {
  display: flex;
  gap: 12px;
  margin-bottom: 24px;
}

.score-badge {
  display: inline-block;
  padding: 6px 14px;
  border-radius: 20px;
  font-size: 0.9rem;
  font-weight: 500;
}

.score-badge.pass {
  background: #dcfce7;
  color: #166534;
}

.score-badge.fail {
  background: #fee2e2;
  color: #dc2626;
}

.score-badge.partial {
  background: #fef3c7;
  color: #d97706;
}

.compare-grid {
  display: grid;
  grid-template-columns: 1fr 1fr;
  gap: 24px;
}

.compare-column {
  background: #f8f9fa;
  border-radius: 8px;
  padding: 20px;
}

.compare-column h2 {
  font-size: 0.9rem;
  font-weight: 600;
  text-transform: uppercase;
  letter-spacing: 0.5px;
  color: #666;
  margin: 0 0 16px;
}

.compare-column.gold {
  border-left: 3px solid #2563eb;
}

.compare-column.actual {
  border-left: 3px solid #7c3aed;
}

.trace-list {
  display: flex;
  flex-direction: column;
  gap: 12px;
}

.trace-item {
  display: flex;
  gap: 12px;
  background: #fff;
  border-radius: 6px;
  padding: 12px;
  border: 1px solid #e0e0e0;
}

.trace-item.match {
  border-color: #86efac;
  background: #f0fdf4;
}

.trace-item.partial-match {
  border-color: #fde047;
  background: #fefce8;
}

.trace-item.mismatch {
  border-color: #fca5a5;
  background: #fef2f2;
}

.trace-item.skipped {
  border-style: dashed;
  background: #fafafa;
}

.call-number {
  display: flex;
  align-items: center;
  justify-content: center;
  width: 28px;
  height: 28px;
  background: #e0e0e0;
  border-radius: 50%;
  font-size: 0.85rem;
  font-weight: 600;
  color: #666;
  flex-shrink: 0;
}

.match-indicator,
.partial-indicator,
.mismatch-indicator {
  margin-left: 4px;
  font-size: 0.75rem;
}

.match-indicator {
  color: #166534;
}

.partial-indicator {
  color: #d97706;
}

.mismatch-indicator {
  color: #dc2626;
}

/* min-width: 0 lets this flex child shrink below its content width. */
.call-content {
  flex: 1;
  min-width: 0;
}

.call-name {
  display: inline-block;
  background: #e8f4fd;
  color: #1e40af;
  padding: 2px 8px;
  border-radius: 4px;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.9rem;
  margin-bottom: 8px;
}

.call-name.wrong {
  background: #fee2e2;
  color: #dc2626;
}

.call-args {
  margin: 0;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.8rem;
  color: #555;
  background: #f1f5f9;
  padding: 8px;
  border-radius: 4px;
  overflow-x: auto;
  white-space: pre-wrap;
  word-break: break-all;
}

.call-args.wrong {
  background: #fef2f2;
  color: #991b1b;
}

.no-calls {
  color: #888;
  font-style: italic;
  padding: 20px;
  text-align: center;
}

.skipped-label {
  color: #888;
  font-style: italic;
}

/* Medium viewports: fewer grid columns for the summary cards and compare grid above. */
@media (max-width: 768px) {
  .summary-cards {
    grid-template-columns: repeat(2, 1fr);
  }

  .compare-grid {
    grid-template-columns: 1fr;
  }
}

/* ---------- View tabs ---------- */

.view-tabs {
  display: flex;
  gap: 8px;
  margin-bottom: 24px;
}

.view-tab {
  padding: 10px 20px;
  border: 1px solid #e0e0e0;
  background: #fff;
  border-radius: 6px;
  cursor: pointer;
  font-size: 0.9rem;
  font-weight: 500;
  color: #666;
  transition: all 0.2s;
}

.view-tab:hover {
  border-color: #ccc;
  color: #333;
}

.view-tab.active {
  background: #2563eb;
  border-color: #2563eb;
  color: #fff;
}

/* ---------- Timeline view ---------- */

.timeline-view {
  background: #f8f9fa;
  border-radius: 8px;
  padding: 24px;
}

.timeline-turns {
  display: flex;
  flex-direction: column;
  gap: 16px;
}

.timeline-turn {
  display: flex;
  gap: 16px;
  background: #fff;
  border-radius: 8px;
  padding: 16px;
  border-left: 4px solid #e0e0e0;
}

.timeline-turn-user {
  border-left-color: #2563eb;
}

.timeline-turn-assistant {
  border-left-color: #7c3aed;
}

.timeline-turn-tool {
  border-left-color: #059669;
  background: #f0fdf4;
}

.timeline-timestamp {
  flex-shrink: 0;
  width: 70px;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.85rem;
  color: #888;
  text-align: right;
  padding-top: 2px;
}

.timeline-content {
  flex: 1;
  min-width: 0;
}

.timeline-role {
  font-size: 0.8rem;
  font-weight: 600;
  text-transform: uppercase;
  letter-spacing: 0.5px;
  color: #666;
  margin-bottom: 8px;
}

.timeline-turn-user .timeline-role {
  color: #2563eb;
}

.timeline-turn-assistant .timeline-role {
  color: #7c3aed;
}

.timeline-turn-tool .timeline-role {
  color: #059669;
}

.timeline-body {
  color: #333;
}

.timeline-text {
  line-height: 1.6;
  white-space: pre-wrap;
}

.timeline-args {
  margin: 8px 0 0;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.85rem;
  background: #f1f5f9;
  padding: 12px;
  border-radius: 6px;
  overflow-x: auto;
  white-space: pre-wrap;
  word-break: break-all;
}

.timeline-result {
  margin-top: 12px;
}

.timeline-result summary {
  cursor: pointer;
  font-size: 0.85rem;
  color: #666;
  font-weight: 500;
}

.timeline-result summary:hover {
  color: #333;
}

/* Capped at 200px tall; scrolls vertically beyond that. */
.timeline-result pre {
  margin: 8px 0 0;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.8rem;
  background: #e8f4fd;
  padding: 12px;
  border-radius: 6px;
  overflow-x: auto;
  white-space: pre-wrap;
  word-break: break-all;
  max-height: 200px;
  overflow-y: auto;
}

.timeline-summary {
  display: flex;
  gap: 24px;
  margin-top: 20px;
  padding-top: 16px;
  border-top: 1px solid #e0e0e0;
  font-size: 0.9rem;
  color: #666;
}

.timeline-summary span {
  font-family: SF Mono, Monaco, monospace;
}

/* ---------- Proposal banner and page ---------- */

.proposal-banner {
  background: #f0f7ff;
  border: 1px solid #cce0ff;
  border-radius: 8px;
  padding: 16px 20px;
  margin-bottom: 32px;
  display: flex;
  justify-content: space-between;
  align-items: center;
  gap: 16px;
}

.proposal-banner span {
  color: #1a4b8c;
  font-size: 0.95rem;
}

.proposal-link {
  color: #2563eb;
  text-decoration: none;
  font-weight: 500;
  white-space: nowrap;
}

.proposal-link:hover {
  text-decoration: underline;
}

.proposal-page {
  max-width: 720px;
  margin: 0 auto;
}

.proposal-nav {
  margin-bottom: 32px;
}

.proposal-content {
  background: #fff;
  border-radius: 8px;
  padding: 40px;
  box-shadow: 0 1px 3px #0000001a;
}

.proposal-content h1 {
  font-size: 1.8rem;
  margin-bottom: 8px;
  line-height: 1.3;
}

.proposal-content h2 {
  font-size: 1.3rem;
  margin-top: 32px;
  margin-bottom: 16px;
  padding-top: 16px;
  border-top: 1px solid #eee;
}

/* The first h2 among its siblings drops the divider line and its top padding. */
.proposal-content h2:first-of-type {
  border-top: none;
  padding-top: 0;
}

.proposal-content p {
  margin-bottom: 16px;
}

.proposal-content ul,
.proposal-content ol {
  margin-bottom: 16px;
  padding-left: 24px;
}

.proposal-content li {
  margin-bottom: 8px;
}

.proposal-content code {
  background: #f5f5f5;
  padding: 2px 6px;
  border-radius: 4px;
  font-family: SF Mono, Monaco, monospace;
  font-size: 0.9em;
}

.proposal-content pre {
  background: #f5f5f5;
  padding: 16px;
  border-radius: 8px;
  overflow-x: auto;
  margin-bottom: 16px;
}

/* Code inside a pre block drops the inline-code background and padding. */
.proposal-content pre code {
  background: none;
  padding: 0;
}

.proposal-content hr {
  border: none;
  border-top: 1px solid #eee;
  margin: 24px 0;
}

.proposal-content strong {
  font-weight: 600;
}

/* ---------- Print ---------- */

@media print {
  body {
    background: #fff;
  }

  .task-detail {
    box-shadow: none;
    border: 1px solid #000;
  }
}
