Skip to content

Commit a77ba69

Browse files
add os models
1 parent 69abe42 commit a77ba69

File tree

1 file changed

+88
-0
lines changed

1 file changed

+88
-0
lines changed

data/leaderboards.json

Lines changed: 88 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1829,6 +1829,28 @@
18291829
],
18301830
"warning": null
18311831
},
1832+
{
1833+
"name": "mini-SWE-agent + Kimi K2 Instruct",
1834+
"logo": [
1835+
"https://mini-swe-agent.com/latest/assets/mini_square.svg"
1836+
],
1837+
"site": "https://mini-swe-agent.com/latest/",
1838+
"folder": "20250807_mini-v1.7.0_Kimi-K2-Instruct",
1839+
"resolved": 43.8,
1840+
"date": "2025-08-07",
1841+
"logs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_Kimi-K2-Instruct/logs",
1842+
"trajs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_Kimi-K2-Instruct/trajs",
1843+
"os_model": true,
1844+
"os_system": true,
1845+
"checked": true,
1846+
"tags": [
1847+
"Org: Moonshot AI",
1848+
"Model: Kimi-K2-Instruct",
1849+
"System: Attempts - 1",
1850+
"Org: SWE-agent"
1851+
],
1852+
"warning": null
1853+
},
18321854
{
18331855
"name": "Solver (2024-09-12)",
18341856
"logo": [
@@ -2439,6 +2461,28 @@
24392461
],
24402462
"warning": null
24412463
},
2464+
{
2465+
"name": "mini-SWE-agent + gpt-oss-120b",
2466+
"logo": [
2467+
"https://mini-swe-agent.com/latest/assets/mini_square.svg"
2468+
],
2469+
"site": "https://mini-swe-agent.com/latest/",
2470+
"folder": "20250807_mini-v1.7.0_gpt-oss-120b",
2471+
"resolved": 26.0,
2472+
"date": "2025-08-07",
2473+
"logs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_gpt-oss-120b/logs",
2474+
"trajs": "s3://swe-bench-experiments/verified/20250807_mini-v1.7.0_gpt-oss-120b/trajs",
2475+
"os_model": true,
2476+
"os_system": true,
2477+
"checked": true,
2478+
"tags": [
2479+
"Org: OpenAI",
2480+
"Model: gpt-oss-120b",
2481+
"System: Attempts - 1",
2482+
"Org: SWE-agent"
2483+
],
2484+
"warning": null
2485+
},
24422486
{
24432487
"name": "nFactorial (2024-10-01)",
24442488
"logo": [
@@ -5049,6 +5093,28 @@
50495093
"warning": null,
50505094
"mini-swe-agent_version": "1.0.0"
50515095
},
5096+
{
5097+
"name": "Kimi K2 Instruct",
5098+
"logo": [
5099+
"https://avatars.githubusercontent.com/u/129152888?s=200&v=4"
5100+
],
5101+
"site": "https://moonshotai.github.io/Kimi-K2/",
5102+
"folder": "20250807_mini-v1.7.0_Kimi-K2-Instruct",
5103+
"resolved": 43.8,
5104+
"date": "2025-08-07",
5105+
"logs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_Kimi-K2-Instruct/logs",
5106+
"trajs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_Kimi-K2-Instruct/trajs",
5107+
"os_model": true,
5108+
"os_system": true,
5109+
"checked": true,
5110+
"tags": [
5111+
"Org: Moonshot AI",
5112+
"Model: Kimi-K2-Instruct",
5113+
"System: Attempts - 1"
5114+
],
5115+
"warning": null,
5116+
"mini-swe-agent_version": "1.7.0"
5117+
},
50525118
{
50535119
"name": "GPT-4.1 (2025-04-14)",
50545120
"logo": [
@@ -5115,6 +5181,28 @@
51155181
"warning": null,
51165182
"mini-swe-agent_version": "1.0.0"
51175183
},
5184+
{
5185+
"name": "gpt-oss-120b",
5186+
"logo": [
5187+
"https://upload.wikimedia.org/wikipedia/commons/6/66/OpenAI_logo_2025_%28symbol%29.svg"
5188+
],
5189+
"site": "https://platform.openai.com/docs/models/gpt-oss-120b",
5190+
"folder": "20250807_mini-v1.7.0_gpt-oss-120b",
5191+
"resolved": 26.0,
5192+
"date": "2025-08-07",
5193+
"logs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_gpt-oss-120b/logs",
5194+
"trajs": "s3://swe-bench-experiments/bash-only/20250807_mini-v1.7.0_gpt-oss-120b/trajs",
5195+
"os_model": true,
5196+
"os_system": true,
5197+
"checked": true,
5198+
"tags": [
5199+
"Org: OpenAI",
5200+
"Model: gpt-oss-120b",
5201+
"System: Attempts - 1"
5202+
],
5203+
"warning": null,
5204+
"mini-swe-agent_version": "1.7.0"
5205+
},
51185206
{
51195207
"name": "GPT-4.1-mini (2025-04-14)",
51205208
"logo": [

0 commit comments

Comments
 (0)