| |
| |
| |
| |
| <!doctype html> |
| <html lang="en"> |
| <head> |
| <meta charset="UTF-8" /> |
| <link rel="icon" type="image/png" href="./favicon.png?v=3" /> |
| <meta name="viewport" content="width=device-width, initial-scale=1.0" /> |
| <meta name="description" content="The Open Agent Leaderboard. Systematic evaluation across diverse environments without domain-specific tuning." /> |
| <title>Open Agent Leaderboard</title> |
| <link rel="preconnect" href="https://fonts.googleapis.com"> |
| <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin> |
| <link href="https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700;800;900&family=JetBrains+Mono:wght@400;500;600&display=swap" rel="stylesheet"> |
| <script src="https://cdn.jsdelivr.net/npm/chart.js@4.4.7/dist/chart.umd.min.js"></script> |
| |
| <script>var t=localStorage.getItem('exgentic-theme');if(t==='light'||(t===null&&window.matchMedia('(prefers-color-scheme:light)').matches))document.documentElement.classList.add('light-mode-early');</script> |
| <link rel="stylesheet" href="./styles.css"> |
| </head> |
|
|
| <body> |
|
|
| |
| <header class="site-header" id="header"> |
| <div class="header-inner"> |
| <a href="https://exgentic.github.io" target="_blank" aria-label="Exgentic Home" class="nav-logo-link"> |
| <svg class="nav-logo-icon" viewBox="0 0 40 48" fill="none" stroke="none"> |
| <polygon points="4,8 36,8 20,30" class="tri-outer"/> |
| <polygon points="4,44 36,44 20,22" class="tri-outer"/> |
| <polygon points="9,10 31,10 20,17" class="tri-inner"/> |
| <polygon points="9,42 31,42 20,35" class="tri-inner"/> |
| </svg> |
| <span class="nav-logo-text">Exgentic</span> |
| </a> |
| <button class="mobile-toggle" id="mobileToggle" aria-label="Toggle navigation">☰</button> |
| <nav class="header-nav" id="headerNav"> |
| <a href="#leaderboard">Leaderboard</a> |
| <a href="#pareto">Efficiency</a> |
| <a href="https://arxiv.org/abs/2602.22953" target="_blank" rel="noopener">Paper</a> |
| <a href="https://github.com/Exgentic/exgentic" target="_blank" rel="noopener" class="btn-nav"> |
| <svg width="16" height="16" viewBox="0 0 16 16" fill="currentColor" style="vertical-align:middle;margin-right:4px"><path d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.013 8.013 0 0016 8c0-4.42-3.58-8-8-8z"/></svg> |
| GitHub |
| </a> |
| <button class="theme-toggle" id="themeToggle" title="Toggle light/dark mode">☾</button> |
| </nav> |
| </div> |
| </header> |
|
|
| |
| <section class="section-alt" id="leaderboard"> |
| <div class="container"> |
| <span class="section-label">Exgentic</span> |
| <h2 class="section-title revealed">Open Agent Leaderboard</h2> |
| <p class="section-subtitle">Systematic evaluation of AI agents across diverse environments — without domain-specific tuning.</p> |
| <div class="leaderboard-controls"><h3>Leaderboard</h3><div><select class="filter-select" id="modelFilter"><option value="all">All Models</option></select></div></div> |
| <div class="table-wrap"><table class="lb-table" id="lbTable"><thead><tr id="lbHead"></tr></thead><tbody id="lbBody"></tbody></table></div> |
| <div class="lb-footer"> |
| <a href="./results.csv" download>Download CSV</a><span>·</span> |
| <a href="./results-README.md">Data Info</a><span>·</span> |
| <a href="./LICENSE-DATA.txt">License (CDLA-Permissive-2.0)</a> |
| </div> |
| </div> |
| </section> |
|
|
| |
| <section id="pareto"> |
| <div class="container"> |
| <span class="section-label">Trade-offs</span> |
| <h2 class="section-title revealed">Cost-Performance Frontier</h2> |
| <p class="section-subtitle">The Pareto frontier of agent efficiency — accuracy vs. spend.</p> |
| <div class="chart-container"> |
| <div class="chart-canvas-wrap"><canvas id="cpChart"></canvas></div> |
| <div class="chart-model-legend" id="modelLegend" style="text-align:center;margin-top:8px;font-size:.75rem;color:var(--text-muted);font-family:'JetBrains Mono',monospace"></div> |
| </div> |
| </div> |
| </section> |
|
|
| <script> |
| |
| const header=document.getElementById('header'); |
| window.addEventListener('scroll',()=>{header.classList.toggle('scrolled',window.scrollY>50)},{passive:true}); |
| document.getElementById('mobileToggle').addEventListener('click',()=>{document.getElementById('headerNav').classList.toggle('open')}); |
| </script> |
| <script src="./scripts/leaderboard.js" data-base="./"></script> |
| <script> |
| |
| (function(){ |
| const btn=document.getElementById('themeToggle'); |
| const saved=localStorage.getItem('exgentic-theme'); |
| if(saved==='light') document.body.classList.add('light-mode'); |
| document.documentElement.classList.remove('light-mode-early'); |
| function update(){ |
| const isLight=document.body.classList.contains('light-mode'); |
| btn.innerHTML=isLight?'☀':'☾'; |
| localStorage.setItem('exgentic-theme',isLight?'light':'dark'); |
| } |
| update(); |
| btn.addEventListener('click',()=>{ |
| document.body.classList.toggle('light-mode'); |
| update(); |
| if(window._chartData) renderChart(window._chartData); |
| }); |
| })(); |
| </script> |
| </body> |
| </html> |
|
|