Skip to content

Commit d7615e4

Browse files
committed
Restore high reasoning suffixes
1 parent 88b71b7 commit d7615e4

1 file changed

Lines changed: 21 additions & 21 deletions

File tree

data/leaderboards.json

Lines changed: 21 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515
],
1616
"logs": null,
1717
"mini-swe-agent_version": "2.0.0",
18-
"name": "Claude 4.5 Opus",
18+
"name": "Claude 4.5 Opus (high reasoning)",
1919
"os_model": false,
2020
"os_system": true,
2121
"per_instance_details": {
@@ -2544,7 +2544,7 @@
25442544
],
25452545
"logs": null,
25462546
"mini-swe-agent_version": "2.0.0",
2547-
"name": "Gemini 3 Flash",
2547+
"name": "Gemini 3 Flash (high reasoning)",
25482548
"os_model": false,
25492549
"os_system": true,
25502550
"per_instance_details": {
@@ -5073,7 +5073,7 @@
50735073
],
50745074
"logs": null,
50755075
"mini-swe-agent_version": "2.0.0",
5076-
"name": "MiniMax M2.5",
5076+
"name": "MiniMax M2.5 (high reasoning)",
50775077
"os_model": false,
50785078
"os_system": true,
50795079
"per_instance_details": {
@@ -15189,7 +15189,7 @@
1518915189
],
1519015190
"logs": null,
1519115191
"mini-swe-agent_version": "2.0.0",
15192-
"name": "GLM-5",
15192+
"name": "GLM-5 (high reasoning)",
1519315193
"os_model": false,
1519415194
"os_system": true,
1519515195
"per_instance_details": {
@@ -17718,7 +17718,7 @@
1771817718
],
1771917719
"logs": null,
1772017720
"mini-swe-agent_version": "2.0.0",
17721-
"name": "GPT-5-2",
17721+
"name": "GPT-5-2 (high reasoning)",
1772217722
"os_model": false,
1772317723
"os_system": true,
1772417724
"per_instance_details": {
@@ -20247,7 +20247,7 @@
2024720247
],
2024820248
"logs": "s3://swe-bench-submissions/bash-only/20251211_mini-v1.17.2_gpt-5.2-2025-12-11-high/logs",
2024920249
"mini-swe-agent_version": "1.17.2",
20250-
"name": "GPT-5.2 (2025-12-11)",
20250+
"name": "GPT-5.2 (2025-12-11) (high reasoning)",
2025120251
"os_model": false,
2025220252
"os_system": true,
2025320253
"per_instance_details": {
@@ -22776,7 +22776,7 @@
2277622776
],
2277722777
"logs": null,
2277822778
"mini-swe-agent_version": "2.0.0",
22779-
"name": "Claude 4.5 Sonnet",
22779+
"name": "Claude 4.5 Sonnet (high reasoning)",
2278022780
"os_model": false,
2278122781
"os_system": true,
2278222782
"per_instance_details": {
@@ -25305,7 +25305,7 @@
2530525305
],
2530625306
"logs": null,
2530725307
"mini-swe-agent_version": "2.0.0",
25308-
"name": "Kimi K2.5",
25308+
"name": "Kimi K2.5 (high reasoning)",
2530925309
"os_model": false,
2531025310
"os_system": true,
2531125311
"per_instance_details": {
@@ -30363,7 +30363,7 @@
3036330363
],
3036430364
"logs": null,
3036530365
"mini-swe-agent_version": "2.0.0",
30366-
"name": "DeepSeek V3.2",
30366+
"name": "DeepSeek V3.2 (high reasoning)",
3036730367
"os_model": false,
3036830368
"os_system": true,
3036930369
"per_instance_details": {
@@ -40454,7 +40454,7 @@
4045440454
],
4045540455
"logs": null,
4045640456
"mini-swe-agent_version": "2.0.0",
40457-
"name": "Claude 4.5 Haiku",
40457+
"name": "Claude 4.5 Haiku (high reasoning)",
4045840458
"os_model": false,
4045940459
"os_system": true,
4046040460
"per_instance_details": {
@@ -113459,7 +113459,7 @@
113459113459
],
113460113460
"logs": "s3://swe-bench-submissions/multilingual/20260213_mini-v2.0.0a0_gpt-5-2-high/logs",
113461113461
"mini-swe-agent_version": "2.0.0a0",
113462-
"name": "GPT-5.2",
113462+
"name": "GPT-5.2 (high reasoning)",
113463113463
"os_model": false,
113464113464
"os_system": true,
113465113465
"per_instance_details": {
@@ -120273,7 +120273,7 @@
120273120273
],
120274120274
"logs": null,
120275120275
"mini-swe-agent_version": "2.0.0",
120276-
"name": "mini-SWE-agent + Claude 4.5 Opus",
120276+
"name": "mini-SWE-agent + Claude 4.5 Opus (high reasoning)",
120277120277
"os_model": false,
120278120278
"os_system": true,
120279120279
"per_instance_details": {
@@ -122831,7 +122831,7 @@
122831122831
],
122832122832
"logs": null,
122833122833
"mini-swe-agent_version": "2.0.0",
122834-
"name": "mini-SWE-agent + Gemini 3 Flash",
122834+
"name": "mini-SWE-agent + Gemini 3 Flash (high reasoning)",
122835122835
"os_model": false,
122836122836
"os_system": true,
122837122837
"per_instance_details": {
@@ -125361,7 +125361,7 @@
125361125361
],
125362125362
"logs": null,
125363125363
"mini-swe-agent_version": "2.0.0",
125364-
"name": "mini-SWE-agent + MiniMax M2.5",
125364+
"name": "mini-SWE-agent + MiniMax M2.5 (high reasoning)",
125365125365
"os_model": false,
125366125366
"os_system": true,
125367125367
"per_instance_details": {
@@ -135765,7 +135765,7 @@
135765135765
],
135766135766
"logs": null,
135767135767
"mini-swe-agent_version": "2.0.0",
135768-
"name": "mini-SWE-agent + GLM-5",
135768+
"name": "mini-SWE-agent + GLM-5 (high reasoning)",
135769135769
"os_model": false,
135770135770
"os_system": true,
135771135771
"per_instance_details": {
@@ -138295,7 +138295,7 @@
138295138295
],
138296138296
"logs": null,
138297138297
"mini-swe-agent_version": "2.0.0",
138298-
"name": "mini-SWE-agent + GPT-5-2",
138298+
"name": "mini-SWE-agent + GPT-5-2 (high reasoning)",
138299138299
"os_model": false,
138300138300
"os_system": true,
138301138301
"per_instance_details": {
@@ -140874,7 +140874,7 @@
140874140874
],
140875140875
"logs": "s3://swe-bench-submissions/verified/20251211_mini-v1.17.2_gpt-5.2-2025-12-11-high/logs",
140876140876
"mini-swe-agent_version": "1.17.2",
140877-
"name": "mini-SWE-agent + GPT-5.2 (2025-12-11)",
140877+
"name": "mini-SWE-agent + GPT-5.2 (2025-12-11) (high reasoning)",
140878140878
"os_model": false,
140879140879
"os_system": true,
140880140880
"per_instance_details": {
@@ -143404,7 +143404,7 @@
143404143404
],
143405143405
"logs": null,
143406143406
"mini-swe-agent_version": "2.0.0",
143407-
"name": "mini-SWE-agent + Claude 4.5 Sonnet",
143407+
"name": "mini-SWE-agent + Claude 4.5 Sonnet (high reasoning)",
143408143408
"os_model": false,
143409143409
"os_system": true,
143410143410
"per_instance_details": {
@@ -146088,7 +146088,7 @@
146088146088
],
146089146089
"logs": null,
146090146090
"mini-swe-agent_version": "2.0.0",
146091-
"name": "mini-SWE-agent + Kimi K2.5",
146091+
"name": "mini-SWE-agent + Kimi K2.5 (high reasoning)",
146092146092
"os_model": false,
146093146093
"os_system": true,
146094146094
"per_instance_details": {
@@ -151298,7 +151298,7 @@
151298151298
],
151299151299
"logs": null,
151300151300
"mini-swe-agent_version": "2.0.0",
151301-
"name": "mini-SWE-agent + DeepSeek V3.2",
151301+
"name": "mini-SWE-agent + DeepSeek V3.2 (high reasoning)",
151302151302
"os_model": false,
151303151303
"os_system": true,
151304151304
"per_instance_details": {
@@ -161506,7 +161506,7 @@
161506161506
],
161507161507
"logs": null,
161508161508
"mini-swe-agent_version": "2.0.0",
161509-
"name": "mini-SWE-agent + Claude 4.5 Haiku",
161509+
"name": "mini-SWE-agent + Claude 4.5 Haiku (high reasoning)",
161510161510
"os_model": false,
161511161511
"os_system": true,
161512161512
"per_instance_details": {

0 commit comments

Comments
 (0)