|
1829 | 1829 | ],
|
1830 | 1830 | "warning": null
|
1831 | 1831 | },
|
| 1832 | + { |
| 1833 | + "name": "mini-SWE-agent + Kimi K2 Instruct", |
| 1834 | + "logo": [ |
| 1835 | + "https://mini-swe-agent.com/latest/assets/mini_square.svg" |
| 1836 | + ], |
| 1837 | + "site": "https://mini-swe-agent.com/latest/", |
| 1838 | + "folder": "20250807_mini-v1.7.0_Kimi-K2-Instruct", |
| 1839 | + "resolved": 43.8, |
| 1840 | + "date": "2025-08-07", |
| 1841 | + "logs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_Kimi-K2-Instruct/logs", |
| 1842 | + "trajs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_Kimi-K2-Instruct/trajs", |
| 1843 | + "os_model": true, |
| 1844 | + "os_system": true, |
| 1845 | + "checked": true, |
| 1846 | + "tags": [ |
| 1847 | + "Org: Moonshot AI", |
| 1848 | + "Model: Kimi-K2-Instruct", |
| 1849 | + "System: Attempts - 1", |
| 1850 | + "Org: SWE-agent" |
| 1851 | + ], |
| 1852 | + "warning": null |
| 1853 | + }, |
1832 | 1854 | {
|
1833 | 1855 | "name": "Solver (2024-09-12)",
|
1834 | 1856 | "logo": [
|
|
2439 | 2461 | ],
|
2440 | 2462 | "warning": null
|
2441 | 2463 | },
|
| 2464 | + { |
| 2465 | + "name": "mini-SWE-agent + gpt-oss-120b", |
| 2466 | + "logo": [ |
| 2467 | + "https://mini-swe-agent.com/latest/assets/mini_square.svg" |
| 2468 | + ], |
| 2469 | + "site": "https://mini-swe-agent.com/latest/", |
| 2470 | + "folder": "20250807_mini-v1.7.0_gpt-oss-120b", |
| 2471 | + "resolved": 26.0, |
| 2472 | + "date": "2025-08-07", |
| 2473 | + "logs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_gpt-oss-120b/logs", |
| 2474 | + "trajs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_gpt-oss-120b/trajs", |
| 2475 | + "os_model": true, |
| 2476 | + "os_system": true, |
| 2477 | + "checked": true, |
| 2478 | + "tags": [ |
| 2479 | + "Org: OpenAI", |
| 2480 | + "Model: gpt-oss-120b", |
| 2481 | + "System: Attempts - 1", |
| 2482 | + "Org: SWE-agent" |
| 2483 | + ], |
| 2484 | + "warning": null |
| 2485 | + }, |
2442 | 2486 | {
|
2443 | 2487 | "name": "nFactorial (2024-10-01)",
|
2444 | 2488 | "logo": [
|
|
5049 | 5093 | "warning": null,
|
5050 | 5094 | "mini-swe-agent_version": "1.0.0"
|
5051 | 5095 | },
|
| 5096 | + { |
| 5097 | + "name": "Kimi K2 Instruct", |
| 5098 | + "logo": [ |
| 5099 | + "https://avatars.githubusercontent.com/u/129152888?s=200&v=4" |
| 5100 | + ], |
| 5101 | + "site": "https://moonshotai.github.io/Kimi-K2/", |
| 5102 | + "folder": "20250807_mini-v1.7.0_Kimi-K2-Instruct", |
| 5103 | + "resolved": 43.8, |
| 5104 | + "date": "2025-08-07", |
| 5105 | + "logs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_Kimi-K2-Instruct/logs", |
| 5106 | + "trajs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_Kimi-K2-Instruct/trajs", |
| 5107 | + "os_model": true, |
| 5108 | + "os_system": true, |
| 5109 | + "checked": true, |
| 5110 | + "tags": [ |
| 5111 | + "Org: Moonshot AI", |
| 5112 | + "Model: Kimi-K2-Instruct", |
| 5113 | + "System: Attempts - 1" |
| 5114 | + ], |
| 5115 | + "warning": null, |
| 5116 | + "mini-swe-agent_version": "1.7.0" |
| 5117 | + }, |
5052 | 5118 | {
|
5053 | 5119 | "name": "GPT-4.1 (2025-04-14)",
|
5054 | 5120 | "logo": [
|
|
5115 | 5181 | "warning": null,
|
5116 | 5182 | "mini-swe-agent_version": "1.0.0"
|
5117 | 5183 | },
|
| 5184 | + { |
| 5185 | + "name": "gpt-oss-120b", |
| 5186 | + "logo": [ |
| 5187 | + "https://upload.wikimedia.org/wikipedia/commons/6/66/OpenAI_logo_2025_%28symbol%29.svg" |
| 5188 | + ], |
| 5189 | + "site": "https://platform.openai.com/docs/models/gpt-oss-120b", |
| 5190 | + "folder": "20250807_mini-v1.7.0_gpt-oss-120b", |
| 5191 | + "resolved": 26.0, |
| 5192 | + "date": "2025-08-07", |
| 5193 | + "logs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_gpt-oss-120b/logs", |
| 5194 | + "trajs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_gpt-oss-120b/trajs", |
| 5195 | + "os_model": true, |
| 5196 | + "os_system": true, |
| 5197 | + "checked": true, |
| 5198 | + "tags": [ |
| 5199 | + "Org: OpenAI", |
| 5200 | + "Model: gpt-oss-120b", |
| 5201 | + "System: Attempts - 1" |
| 5202 | + ], |
| 5203 | + "warning": null, |
| 5204 | + "mini-swe-agent_version": "1.7.0" |
| 5205 | + }, |
5118 | 5206 | {
|
5119 | 5207 | "name": "GPT-4.1-mini (2025-04-14)",
|
5120 | 5208 | "logo": [
|
|
0 commit comments