| #1 | GPT-5.2-CodexOpenAI | 75.7 | |
| #2 | GPT-5OpenAI | 75.6 | |
| #3 | GPT-5.1OpenAI | 75 | |
| #4 | GPT-5.5OpenAI | 74.3 | |
| #5 | KAT-Coder-Pro V1Kuaishou | 74 | |
| #6 | GPT-5.3-CodexOpenAI | 74 | |
| #7 | Claude Opus 4.5Anthropic | 74 | |
| #8 | GPT-5.4OpenAI | 74 | |
| #9 | MiMo-V2.5-ProXiaomi | 73.3 | |
| #10 | Gemini 3.1 ProGoogle | 72.7 | |
| #11 | GPT-5.2OpenAI | 72.7 | |
| #12 | Gemini 3.5 FlashGoogle | 71 | |
| #13 | Gemini 3 ProGoogle | 70.7 | |
| #14 | Claude Sonnet 4.6Anthropic | 70.7 | |
| #15 | Claude Opus 4.6Anthropic | 70.7 | |
| #16 | Claude Opus 4.7Anthropic | 70.3 | |
| #17 | Claude Haiku 4.5Anthropic | 70.3 | |
| #18 | Muse SparkMeta | 69.7 | |
| #19 | Qwen3.6 PlusAlibaba | 69.7 | |
| #20 | Qwen3.6 MaxAlibaba | 69.7 | |
| #21 | Kimi K2.6Moonshot AI | 69.7 | |
| #22 | GPT-5.4 miniOpenAI | 69.3 | |
| #23 | o3OpenAI | 69.3 | |
| #24 | Qwen3.7 MaxAlibaba | 69 | |
| #25 | GPT-5 CodexOpenAI | 69 | |
| #26 | DeepSeek V3.2 ExpDeepSeek | 69 | |
| #27 | MiniMax M2.7MiniMax | 68.7 | |
| #28 | Qwen3.6 27BAlibaba | 68.7 | |
| #29 | Grok 4.1 FastxAI | 68 | |
| #30 | Grok 4xAI | 68 | |
| #31 | GPT-5 miniOpenAI | 68 | |
| #32 | Claude Opus 4.8Anthropic | 67.7 | |
| #33 | GPT-5.1-CodexOpenAI | 67.3 | |
| #34 | Qwen3.5-27BAlibaba | 67.3 | |
| #35 | Qwen3 235B A22B 2507Alibaba | 67 | |
| #36 | MiMo-V2-OmniXiaomi | 66.7 | |
| #37 | Qwen3.5-122B-A10BAlibaba | 66.7 | |
| #38 | Kimi K2 ThinkingMoonshot AI | 66.3 | |
| #39 | DeepSeek-V4-ProDeepSeek | 66.3 | |
| #40 | Gemini 3 FlashGoogle | 66.3 | |
| #41 | Claude Opus 4.1Anthropic | 66.3 | |
| #42 | KAT-Coder-Pro V2Kuaishou | 66 | |
| #43 | Qwen3 Max ThinkingAlibaba | 66 | |
| #44 | MiniMax M2.5MiniMax | 66 | |
| #45 | GPT-5.4 nanoOpenAI | 66 | |
| #46 | Gemini 2.5 ProGoogle | 66 | |
| #47 | Qwen3.5 397B A17BAlibaba | 65.7 | |
| #48 | Claude Sonnet 4.5Anthropic | 65.7 | |
| #49 | Doubao Seed CodeByteDance | 65.3 | |
| #50 | Gemini 3.1 Flash LiteGoogle | 65.3 | |
| #51 | Kimi K2.5Moonshot AI | 65.3 | |
| #52 | DeepSeek V3.1 TerminusDeepSeek | 65 | |
| #53 | DeepSeek-V3.2DeepSeek | 65 | |
| #54 | Grok 4.3xAI | 65 | |
| #55 | Grok 4 FastxAI | 64.7 | |
| #56 | Claude Sonnet 4Anthropic | 64.7 | |
| #57 | MiMo-V2-FlashXiaomi | 64.3 | |
| #58 | Ring-2.6-1TInclusionAI | 64.3 | |
| #59 | GLM 4.7Zhipu AI | 64 | |
| #60 | MiMo-V2-Omni-0327Xiaomi | 63.7 | |
| #61 | Qwen3.6 35B A3BAlibaba | 63.7 | |
| #62 | GLM-5Zhipu AI | 63.3 | |
| #63 | DeepSeek-V4-FlashDeepSeek | 63 | |
| #64 | MiMo-V2.5Xiaomi | 62.7 | |
| #65 | GPT-5.1-Codex-MiniOpenAI | 62.7 | |
| #66 | Qwen3.5-35B-A3BAlibaba | 62.7 | |
| #67 | GLM 5.1Zhipu AI | 62.3 | |
| #68 | Gemma 4 31BGoogle | 62 | |
| #69 | Nova 2.0 ProAmazon | 61.7 | |
| #70 | Gemini 2.5 FlashGoogle | 61.7 | |
| #71 | GLM 5V TurboZhipu AI | 61 | |
| #72 | Mistral Medium 3.5Mistral AI | 61 | |
| #73 | MiniMax-M2MiniMax | 61 | |
| #74 | GPT-4.1OpenAI | 61 | |
| #75 | MiMo-V2-ProXiaomi | 60.7 | |
| #76 | GLM 5 TurboZhipu AI | 60.7 | |
| #77 | Claude 3.7 SonnetAnthropic | 60.7 | |
| #78 | Qwen3-Next-80B-A3BAlibaba | 60.3 | |
| #79 | NVIDIA Nemotron 3 Super 120B A12BNVIDIA | 60 | |
| #80 | DeepSeek V3.2 SpecialeDeepSeek | 59.3 | |
| #81 | o1OpenAI | 59.3 | |
| #82 | Qwen3 30B A3B 2507Alibaba | 59 | |
| #83 | Grok 4.20 0309xAI | 59 | |
| #84 | MiniMax M2.1MiniMax | 59 | |
| #85 | Qwen3.5-9BAlibaba | 59 | |
| #86 | Qwen3 VL 235B A22BAlibaba | 58.7 | |
| #87 | Nova 2 LiteAmazon | 58.3 | |
| #88 | Grok 4.20 0309 v2xAI | 58 | |
| #89 | Seed-OSS-36B-InstructByteDance | 57.7 | |
| #90 | Qwen3.5 4BAlibaba | 55.7 | |
| #91 | K-EXAONELG AI Research | 55.7 | |
| #92 | Gemma 4 26B A4BGoogle | 55.7 | |
| #93 | Qwen3 VL 32BAlibaba | 55.3 | |
| #94 | JT-35B-FlashChina Mobile | 55.3 | |
| #95 | o4-miniOpenAI | 55 | |
| #96 | DeepSeek-R1-0528DeepSeek | 54.7 | |
| #97 | Hy3Tencent | 54.7 | |
| #98 | Grok-3xAI | 54.7 | |
| #99 | MiniMax M1 80kMiniMax | 54.3 | |
| #100 | Step 3.5 Flash 2603StepFun | 54.3 | |
| #101 | GLM-4.6Zhipu AI | 54.3 | |
| #102 | Nova 2.0 OmniAmazon | 53.7 | |
| #103 | DeepSeek-V3.1DeepSeek | 53.3 | |
| #104 | GPT-4oOpenAI | 53 | |
| #105 | Qwen3.5 Omni PlusAlibaba | 52.7 | |
| #106 | K2 Think V2MBZUAI Institute of Foundation Models | 52.7 | |
| #107 | Kimi K2 0905Moonshot AI | 52.3 | |
| #108 | DeepSeek-R1DeepSeek | 52.3 | |
| #109 | MiniMax M1 40kMiniMax | 51.7 | |
| #110 | Magistral Medium 1.2Mistral AI | 51.3 | |
| #111 | Gemini 2.5 Flash LiteGoogle | 51.3 | |
| #112 | Qwen3 Next 80B A3B InstructAlibaba | 51.3 | |
| #113 | Kimi K2Moonshot AI | 51 | |
| #114 | gpt-oss-120bOpenAI | 50.7 | |
| #115 | Apriel-v1.6-15B-ThinkerServiceNow | 50.3 | |
| #116 | Grok 3 mini ReasoningxAI | 50.3 | |
| #117 | EXAONE 4.5 33BLG AI Research | 49.3 | |
| #118 | Grok Code Fast 1xAI | 48.3 | |
| #119 | GLM-4.5Zhipu AI | 48.3 | |
| #120 | Qwen3 MaxAlibaba | 46.7 | |
| #121 | Command ACohere | 46 | |
| #122 | Llama 4 MaverickMeta | 46 | |
| #123 | Ring-1TInclusionAI | 45.7 | |
| #124 | Mistral Small 4Mistral AI | 44.7 | |
| #125 | Qwen3.5 Omni FlashAlibaba | 44 | |
| #126 | GLM 4.5 AirZhipu AI | 43.7 | |
| #127 | Step 3.5 FlashStepFun | 43 | |
| #128 | Qwen3 Coder 480B A35B InstructAlibaba | 42.3 | |
| #129 | GPT-4.1 MiniOpenAI | 42.3 | |
| #130 | GPT-5 nanoOpenAI | 41.7 | |
| #131 | DeepSeek-V3 0324DeepSeek | 41 | |
| #132 | Qwen3 VL 30B A3BAlibaba | 40.7 | |
| #133 | GLM 4.6VZhipu AI | 40.3 | |
| #134 | NVIDIA Nemotron Nano 12B v2 VLNVIDIA | 40 | |
| #135 | Qwen3 Coder NextAlibaba | 40 | |
| #136 | o3-miniOpenAI | 39.3 | |
| #137 | Qwen3 4B 2507Alibaba | 37.7 | |
| #138 | Mercury 2Inception | 36.3 | |
| #139 | Solar Open 100BUpstage | 36 | |
| #140 | Claude Opus 4Anthropic | 36 | |
| #141 | Nemotron 3 Nano Omni 30B A3B ReasoningNVIDIA | 35.7 | |
| #142 | GLM 4.7 FlashZhipu AI | 35 | |
| #143 | Ling-1TInclusionAI | 34.7 | |
| #144 | Ling-2.6-1TInclusionAI | 34.7 | |
| #145 | Mistral Large 3Mistral AI | 34.7 | |
| #146 | Nemotron Cascade 2 30B A3BNVIDIA | 34 | |
| #147 | Llama Nemotron Super 49B v1.5NVIDIA | 34 | |
| #148 | NVIDIA Nemotron 3 Nano 30B A3BNVIDIA | 33.7 | |
| #149 | K2-V2MBZUAI Institute of Foundation Models | 33.3 | |
| #150 | Trinity Large ThinkingArcee AI | 33 | |
| #151 | INTELLECT-3Prime Intellect | 32.3 | |
| #152 | Qwen3 VL 235B A22B InstructAlibaba | 31.7 | |
| #153 | Qwen3 VL 32B InstructAlibaba | 31.3 | |
| #154 | Qwen3-235B-A22B-Instruct-2507Alibaba | 31.2 | |
| #155 | Qwen3 VL 8BAlibaba | 31 | |
| #156 | gpt-oss-20bOpenAI | 31 | |
| #157 | Gemma 4 E4BGoogle | 30.7 | |
| #158 | Nova PremierAmazon | 30 | |
| #159 | Devstral 2Mistral AI | 30 | |
| #160 | Qwen3 Coder 30B A3B InstructAlibaba | 29 | |
| #161 | DeepSeek-V3DeepSeek | 29 | |
| #162 | Devstral MediumMistral AI | 28.7 | |
| #163 | Gemini 2.0 FlashGoogle | 28.3 | |
| #164 | Mistral Medium 3Mistral AI | 28 | |
| #165 | Solar Pro 3Upstage | 27 | |
| #166 | Devstral SmallMistral AI | 26.7 | |
| #167 | Llama 4 ScoutMeta | 25.8 | |
| #168 | LongCat Flash LiteLongCat | 25.7 | |
| #169 | Kimi Linear 48B A3B InstructMoonshot AI | 25.7 | |
| #170 | QwQ-32BAlibaba | 25 | |
| #171 | Ling-2.6-flashInclusionAI | 25 | |
| #172 | Llama 3.1 405B InstructMeta | 24.3 | |
| #173 | Devstral Small 2Mistral AI | 24 | |
| #174 | Ministral 3 8BMistral AI | 24 | |
| #175 | Qwen3.5 2BAlibaba | 23.7 | |
| #176 | Qwen3 VL 30B A3B InstructAlibaba | 23.7 | |
| #177 | Claude 3.5 HaikuAnthropic | 23.3 | |
| #178 | Qwen3 30B A3B 2507 InstructAlibaba | 22.7 | |
| #179 | NVIDIA Nemotron Nano 9B V2NVIDIA | 22.7 | |
| #180 | Ministral 3 14BMistral AI | 22 | |
| #181 | Cogito v2.1Deep Cogito | 21.7 | |
| #182 | Qwen3 VL 4BAlibaba | 21.3 | |
| #183 | Ring-flash-2.0InclusionAI | 21 | |
| #184 | Claude 3 HaikuAnthropic | 21 | |
| #185 | Hermes 4 - Llama-3.1 405BNous Research | 20.7 | |
| #186 | Qwen2.5 72B InstructAlibaba | 20.3 | |
| #187 | Apriel-v1.5-15B-ThinkerServiceNow | 20 | |
| #188 | Mistral Small 3.1Mistral AI | 19.7 | |
| #189 | Mistral Medium 3.1Mistral AI | 19.7 | |
| #190 | Nova ProAmazon | 19 | |
| #191 | Granite 4.1 30BIBM | 18.7 | |
| #192 | Nova LiteAmazon | 17.7 | |
| #193 | Mistral Small 3.2Mistral AI | 17.3 | |
| #194 | Jamba Large 1.7AI21 Labs | 17.3 | |
| #195 | Llama-3.3 Nemotron Super 49B v1NVIDIA | 17 | |
| #196 | GPT-4.1 NanoOpenAI | 17 | |
| #197 | NVIDIA Nemotron 3 Nano 4BNVIDIA | 16.7 | |
| #198 | Magistral Small 1.2Mistral AI | 16.3 | |
| #199 | Llama 3.1 8B InstructMeta | 15.7 | |
| #200 | Qwen3 VL 8B InstructAlibaba | 15.3 | |
| #201 | Ling-flash-2.0InclusionAI | 15 | |
| #202 | Gemma 4 E2BGoogle | 15 | |
| #203 | Llama 3.3 70B InstructMeta | 15 | |
| #204 | Tri-21B-ThinkTrillion Labs | 14.7 | |
| #205 | EXAONE 4.0 32BLG AI Research | 14 | |
| #206 | Phi 4 Mini InstructMicrosoft | 13.7 | |
| #207 | Qwen3 VL 4B InstructAlibaba | 13 | |
| #208 | DeepSeek R1 0528 Qwen3 8BDeepSeek | 13 | |
| #209 | Motif-2-12.7B-ReasoningMotif Technologies | 13 | |
| #210 | Jamba 1.7 MiniAI21 Labs | 12.7 | |
| #211 | Granite 4.1 8BIBM | 12 | |
| #212 | JT-MINIChina Mobile | 11.7 | |
| #213 | HyperCLOVA X SEED ThinkNaver | 11.7 | |
| #214 | Llama 3.2 11B InstructMeta | 11.7 | |
| #215 | Ministral 3 3BMistral AI | 11.7 | |
| #216 | Mi:dm K 2.5 ProKorea Telecom | 11 | |
| #217 | DeepSeek R1 Distill Llama 70BDeepSeek | 11 | |
| #218 | Pixtral LargeMistral AI | 10.3 | |
| #219 | Nova MicroAmazon | 9.7 | |
| #220 | DeepSeek R1 Distill Qwen 32BDeepSeek | 9.7 | |
| #221 | Granite 4.0 H SmallIBM | 9 | |
| #222 | Falcon-H1R-7BTII UAE | 8.7 | |
| #223 | Qwen3 4B 2507 InstructAlibaba | 7.3 | |
| #224 | Llama 3.1 Nemotron Ultra 253B v1NVIDIA | 7.3 | |
| #225 | Jamba Reasoning 3BAI21 Labs | 7 | |
| #226 | Llama 3.1 Nemotron 70B InstructNVIDIA | 7 | |
| #227 | DeepSeek R1 Distill Qwen 14BDeepSeek | 7 | |
| #228 | Gemma 3 12B InstructGoogle | 6.7 | |
| #229 | Ling-mini-2.0InclusionAI | 6.7 | |
| #230 | Qwen3.5 0.8BAlibaba | 6.7 | |
| #231 | ERNIE 5.0 ThinkingBaidu | 6.7 | |
| #232 | Hermes 4 - Llama-3.1 70BNous Research | 6.7 | |
| #233 | MiniCPM-V 4.6 1.3BOpenBMB | 6.3 | |
| #234 | Granite 4.0 H 1BIBM | 6.3 | |
| #235 | Llama 3.1 70B InstructMeta | 6.3 | |
| #236 | Gemma 3 4B InstructGoogle | 5.7 | |
| #237 | Gemma 3 27B InstructGoogle | 5.7 | |
| #238 | Mistral Large 2Mistral AI | 5.3 | |
| #239 | Llama 3.2 1B InstructMeta | 5 | |
| #240 | MiniCPM5-1BOpenBMB | 4.7 | |
| #241 | Granite 3.3 8BIBM | 4.3 | |
| #242 | Granite 4.0 1BIBM | 4 | |
| #243 | Granite 4.0 MicroIBM | 4 | |
| #244 | Granite 4.1 3BIBM | 3 | |
| #245 | ERNIE 4.5 300B A47BBaidu | 2.3 | |
| #246 | Phi-3 Mini Instruct 3.8BMicrosoft | 2 | |
| #247 | Llama 3.2 3B InstructMeta | 2 | |
| #248 | DeepSeek R1 Distill Qwen 1.5BDeepSeek | 0.3 | |
| #249 | Qwen3 0.6BAlibaba | 0 | |
| #250 | Qwen3 4BAlibaba | 0 | |
| #251 | Qwen3 1.7BAlibaba | 0 | |
| #252 | Sarvam MSarvam | 0 | |
| #253 | OLMo 2 7BAllen Institute for AI | 0 | |
| #254 | OLMo 2 32BAllen Institute for AI | 0 | |
| #255 | LFM2 1.2BLiquid AI | 0 | |
| #256 | Magistral Small 1Mistral AI | 0 | |
| #257 | Magistral Medium 1Mistral AI | 0 | |
| #258 | Mistral 7B InstructMistral AI | 0 | |
| #259 | Gemma 3n E2B InstructGoogle | 0 | |
| #260 | Gemma 3n E4B InstructGoogle | 0 | |
| #261 | Gemma 3 1B InstructGoogle | 0 | |
| #262 | Qwen3 Omni 30B A3B InstructAlibaba | 0 | |
| #263 | Qwen3 Omni 30B A3BAlibaba | 0 | |
| #264 | Tiny Aya GlobalCohere | 0 | |
| #265 | Apertus 70B InstructSwiss AI Initiative | 0 | |
| #266 | Apertus 8B InstructSwiss AI Initiative | 0 | |
| #267 | Nanbeige4.1-3BNanbeige | 0 | |
| #268 | Sarvam 30BSarvam | 0 | |
| #269 | Sarvam 105BSarvam | 0 | |
| #270 | Exaone 4.0 1.2BLG AI Research | 0 | |
| #271 | Granite 4.0 350MIBM | 0 | |
| #272 | Granite 4.0 H 350MIBM | 0 | |
| #273 | Olmo 3.1 32B ThinkAllen Institute for AI | 0 | |
| #274 | Molmo2-8BAllen Institute for AI | 0 | |
| #275 | Olmo 3.1 32B InstructAllen Institute for AI | 0 | |
| #276 | Olmo 3 7B ThinkAllen Institute for AI | 0 | |
| #277 | Molmo 7B-DAllen Institute for AI | 0 | |
| #278 | Olmo 3 7B InstructAllen Institute for AI | 0 | |
| #279 | Step3 VL 10BStepFun | 0 | |
| #280 | Llama 3.1 Nemotron Nano 4B v1.1NVIDIA | 0 | |
| #281 | Solar Pro 2Upstage | 0 | |
| #282 | LFM2.5-VL-1.6BLiquid AI | 0 | |
| #283 | LFM2.5-1.2B-ThinkingLiquid AI | 0 | |
| #284 | LFM2 2.6BLiquid AI | 0 | |
| #285 | LFM2.5-1.2B-InstructLiquid AI | 0 | |
| #286 | LFM2 8B A1BLiquid AI | 0 | |
| #287 | Gemma 3 270MGoogle | 0 | |
| #288 | Reka Flash 3Reka AI | 0 | |
| #289 | DeepSeek R1 Distill Llama 8BDeepSeek | 0 | |
| #290 | Llama 3 8B InstructMeta | 0 | |
| #291 | Llama 3 70B InstructMeta | 0 | |
| #292 | Phi 4Microsoft | 0 | |
| #293 | Mistral Small 3Mistral AI | 0 | |
| #294 | Qwen3 235B A22BAlibaba | 0 | |
| #295 | Qwen3 32BAlibaba | 0 | |
| #296 | Qwen3 14BAlibaba | 0 | |
| #297 | Qwen3 8BAlibaba | 0 | |
| #298 | Qwen3 30B A3BAlibaba | 0 | |
| #299 | GLM 4.5VZhipu AI | 0 | |
| #300 | Olmo 3 32B ThinkAllen Institute for AI | 0 | |
| #301 | LFM2-24B-A2BLiquid AI | 0 | |