Skip to content

Commit 9bc91b0

Browse files
ericyangpan and claude committed
chore: update model benchmark scores and metadata
- Add benchmark scores to 33 model manifests
- SWE-bench, TerminalBench, SciCode, LiveCodeBench scores
- MMMU and WebDevArena scores (where available)
- Update GitHub stars data
- Regenerate metadata files from updated manifests

Models updated with benchmarks:
- Anthropic Claude (4, 4.5, Haiku, Opus, Sonnet)
- OpenAI GPT (4o, 4.1, 5, 5.1, Codex variants)
- Google Gemini (2.5 Flash, 2.5 Pro, 3 Pro)
- DeepSeek (R1, V3 Terminus)
- Alibaba Qwen3 Coder (30B, 480B, Plus)
- Z.ai GLM-4.6
- Meta Llama 4 Maverick
- Moonshot Kimi K2
- xAI Grok Code Fast 1
- MiniMax M2

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
1 parent 1252b8d commit 9bc91b0

29 files changed

+179
-24
lines changed

data/github-stars.json

Lines changed: 25 additions & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -2,36 +2,37 @@
22
"extensions": {
33
"amp": null,
44
"augment-code": null,
5-
"claude-code": 44,
6-
"cline": 53.8,
7-
"codex": 51.5,
8-
"continue": 30.1,
5+
"claude-code": 45,
6+
"cline": 55.7,
7+
"codex": 52.1,
8+
"continue": 30.2,
99
"droid": null,
10+
"gemini-code-assist": null,
1011
"github-copilot": null,
1112
"jetbrains-junie": null,
12-
"kilo-code": 12.7,
13+
"kilo-code": 13,
1314
"qoder": null,
14-
"roo-code": 20.9,
15+
"roo-code": 21.1,
1516
"tabnine": 10.8
1617
},
1718
"clis": {
1819
"amazon-q-developer-cli": 1.8,
1920
"amp-cli": null,
2021
"augment-code-cli": 0.1,
21-
"claude-code-cli": 44,
22+
"claude-code-cli": 45,
2223
"cline-cli": null,
2324
"codebuddy-cli": null,
24-
"codex-cli": 51.5,
25-
"continue-cli": 30.1,
25+
"codex-cli": 52.1,
26+
"continue-cli": 30.2,
2627
"droid-cli": null,
27-
"gemini-cli": 84.6,
28-
"github-copilot-cli": 5.5,
29-
"kilo-code-cli": 12.7,
30-
"kimi-cli": 3.3,
31-
"kiro-cli": null,
32-
"kode": 3.6,
33-
"neovate-code": 1.1,
34-
"opencode": 34.5,
28+
"gemini-cli": 86.3,
29+
"github-copilot-cli": 5.8,
30+
"kilo-code-cli": 13,
31+
"kimi-cli": 3.5,
32+
"kiro-cli": 2.4,
33+
"kode": 3.7,
34+
"neovate-code": 1.2,
35+
"opencode": 37.1,
3536
"qoder-cli": null
3637
},
3738
"ides": {
@@ -40,11 +41,15 @@
4041
"codeflicker": null,
4142
"cursor": 31.8,
4243
"intellij-idea": 19.2,
43-
"kiro": 2.3,
44+
"kiro": 2.4,
4445
"qoder": null,
4546
"trae": null,
46-
"vscode": 179.1,
47+
"vscode": 179.4,
4748
"windsurf": null,
48-
"zed": 70.6
49+
"zed": 71.1
50+
},
51+
"models": {
52+
"composer": null,
53+
"glm-4-6v": null
4954
}
5055
}

manifests/models/claude-haiku-4-5.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": null,
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/claude-4-5-haiku",
2626
"openrouter": "https://openrouter.ai/anthropic/claude-haiku-4.5"
27+
},
28+
"benchmarks": {
29+
"sweBench": null,
30+
"terminalBench": 0.298,
31+
"sciCode": null,
32+
"liveCodeBench": null
2733
}
2834
}

manifests/models/claude-opus-4-1.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": null,
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/claude-4-1-opus",
2626
"openrouter": "https://openrouter.ai/anthropic/claude-opus-4.1"
27+
},
28+
"benchmarks": {
29+
"sweBench": null,
30+
"terminalBench": 0.38,
31+
"sciCode": null,
32+
"liveCodeBench": 46.9
2733
}
2834
}

manifests/models/claude-opus-4.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": null,
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/claude-4-opus",
2626
"openrouter": "https://openrouter.ai/anthropic/claude-opus-4"
27+
},
28+
"benchmarks": {
29+
"sweBench": null,
30+
"terminalBench": 0.578,
31+
"sciCode": null,
32+
"liveCodeBench": 56.6
2733
}
2834
}

manifests/models/claude-sonnet-4-5.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": null,
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/claude-4-5-sonnet",
2626
"openrouter": "https://openrouter.ai/anthropic/claude-sonnet-4.5"
27+
},
28+
"benchmarks": {
29+
"sweBench": null,
30+
"terminalBench": 0.428,
31+
"sciCode": null,
32+
"liveCodeBench": 47.1
2733
}
2834
}

manifests/models/claude-sonnet-4.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": null,
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/claude-4-sonnet",
2626
"openrouter": "https://openrouter.ai/anthropic/claude-sonnet-4"
27+
},
28+
"benchmarks": {
29+
"sweBench": null,
30+
"terminalBench": 0.428,
31+
"sciCode": null,
32+
"liveCodeBench": 55.9
2733
}
2834
}

manifests/models/deepseek-r1.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": "https://huggingface.co/deepseek-ai/DeepSeek-R1",
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/deepseek-r1",
2626
"openrouter": "https://openrouter.ai/deepseek/deepseek-r1"
27+
},
28+
"benchmarks": {
29+
"sweBench": null,
30+
"terminalBench": null,
31+
"sciCode": 4.6,
32+
"liveCodeBench": 73.1
2733
}
2834
}

manifests/models/deepseek-v3-terminus.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": "https://huggingface.co/deepseek-ai/DeepSeek-V3.1-Terminus",
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/deepseek-v3-1-terminus",
2626
"openrouter": "https://openrouter.ai/deepseek/deepseek-v3.1-terminus"
27+
},
28+
"benchmarks": {
29+
"sweBench": null,
30+
"terminalBench": null,
31+
"sciCode": 3.1,
32+
"liveCodeBench": 27.2
2733
}
2834
}

manifests/models/gemini-2-5-flash.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": null,
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/gemini-2-5-flash",
2626
"openrouter": "https://openrouter.ai/google/gemini-2.5-flash"
27+
},
28+
"benchmarks": {
29+
"sweBench": 28.73,
30+
"terminalBench": 0.171,
31+
"sciCode": null,
32+
"liveCodeBench": 61.9
2733
}
2834
}

manifests/models/gemini-2-5-pro.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,5 +24,11 @@
2424
"huggingface": null,
2525
"artificialAnalysis": "https://artificialanalysis.ai/models/gemini-2-5-pro",
2626
"openrouter": "https://openrouter.ai/google/gemini-2.5-pro"
27+
},
28+
"benchmarks": {
29+
"sweBench": 53.6,
30+
"terminalBench": 0.326,
31+
"sciCode": null,
32+
"liveCodeBench": 73.6
2733
}
2834
}

0 commit comments

Comments
 (0)