Skip to content

Commit c7ddabc

Browse files
authored
Merge pull request #38 from SWE-bench/add-cost-col
[WIP] Add cost column and docent link
2 parents 38bf023 + 91eabd4 commit c7ddabc

File tree

1 file changed

+12
-6
lines changed

1 file changed

+12
-6
lines changed

js/mainResults.js

Lines changed: 12 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -43,6 +43,10 @@ function sortItems(a, b, field, direction) {
4343
case 'trajs':
4444
case 'site':
4545
return item[field] ? 1 : 0;
46+
case 'instance_cost':
47+
return parseFloat(item.instance_cost) || 0;
48+
case 'trajs_docent':
49+
return item.trajs_docent && item.trajs_docent !== false ? 1 : 0;
4650
case 'release':
4751
return (item['mini-swe-agent_version'] || '').toLowerCase();
4852
default:
@@ -96,10 +100,11 @@ function renderLeaderboardTable(leaderboard) {
96100
<tr>
97101
<th class="sortable" data-sort="name">Model</th>
98102
<th class="sortable" data-sort="resolved">% Resolved</th>
103+
${isBashOnly ? '<th class="sortable" data-sort="instance_cost" title="Average cost per task instance in the benchmark">Avg. $</th>' : ''}
99104
<th class="sortable" data-sort="org">Org</th>
100105
<th class="sortable" data-sort="date">Date</th>
101-
<th class="sortable" data-sort="site">Site</th>
102-
${isBashOnly ? '<th class="sortable" data-sort="release">Release</th>' : ''}
106+
${!isBashOnly ? '<th class="sortable" data-sort="site">Site</th>' : ''}
107+
${isBashOnly ? '<th class="sortable" data-sort="release" title="mini-swe-agent release with which the benchmark was run. Click the release to see the release note. Generally, results should be very comparable across releases.">Release</th>' : ''}
103108
</tr>
104109
</thead>
105110
<tbody>
@@ -121,6 +126,7 @@ function renderLeaderboardTable(leaderboard) {
121126
</div>
122127
</td>
123128
<td><span class="number fw-medium text-primary">${parseFloat(item.resolved).toFixed(2)}</span></td>
129+
${isBashOnly ? `<td class="text-right"><span class="number fw-medium text-primary">${item.instance_cost !== null && item.instance_cost !== undefined ? parseFloat(item.instance_cost).toFixed(2) : ''}</span></td>` : ''}
124130
<td>
125131
${item.logo && item.logo.length > 0 ? `
126132
<div style="display: flex; align-items: center;">
@@ -129,14 +135,14 @@ function renderLeaderboardTable(leaderboard) {
129135
` : '-'}
130136
</td>
131137
<td><span class="label-date text-muted">${item.date}</span></td>
132-
<td class="centered-text text-center">
138+
${!isBashOnly ? `<td class="centered-text text-center">
133139
${item.site ? `<a href="${item.site}" target="_blank" rel="noopener noreferrer"><i class="fas fa-external-link-alt"></i></a>` : '<span class="text-muted">-</span>'}
134-
</td>
135-
${isBashOnly ? `<td><span class="text-muted font-mono">${item['mini-swe-agent_version'] || '-'}</span></td>` : ''}
140+
</td>` : ''}
141+
${isBashOnly ? `<td><span class="text-muted font-mono">${item['mini-swe-agent_version'] && item['mini-swe-agent_version'] !== '0.0.0' ? `<a href="https://github.com/SWE-agent/mini-swe-agent/tree/v${item['mini-swe-agent_version']}" target="_blank" rel="noopener noreferrer">${item['mini-swe-agent_version']}</a>` : (item['mini-swe-agent_version'] || '-')}</span></td>` : ''}
136142
</tr>
137143
`).join('')}
138144
<tr class="no-results" style="display: none;">
139-
<td colspan="${isBashOnly ? '8' : '7'}" class="text-center">
145+
<td colspan="${isBashOnly ? '9' : '7'}" class="text-center">
140146
No entries match the selected filters. Try adjusting your filters.
141147
</td>
142148
</tr>

0 commit comments

Comments
 (0)