| 1 | Claude Opus 4.6 · Anthropic | Anthropic | 83.9 | 83.7 | 96 | 72.1 | -- |
| 2 | Claude Sonnet 4.6 · Anthropic | Anthropic | 80.9 | 79.6 | 95.2 | 68.4 | -- |
| 3 | GPT-5.4 · OpenAI | OpenAI | 78.7 | 80 | 97.5 | -- | -- |
| 4 | Claude Opus 4.5 · Anthropic | Anthropic | 78.3 | 80.9 | 95.2 | -- | -- |
| 5 | GPT-5.2 · OpenAI | OpenAI | 77.5 | 78 | 97 | -- | -- |
| 6 | GPT-5.1 · OpenAI | OpenAI | 76.7 | 76.5 | 96.8 | -- | -- |
| 7 | Claude Sonnet 4.5 · Anthropic | Anthropic | 76.2 | 77.2 | 94.5 | -- | -- |
| 8 | GPT-5 · OpenAI | OpenAI | 75.8 | 75 | 96.5 | -- | -- |
| 9 | Gemini 3 Flash Preview · Google | Google | 75.6 | 78 | 92 | -- | -- |
| 10 | o3 · OpenAI | OpenAI | 74.3 | 71.7 | 97 | -- | -- |
| 11 | Claude Opus 4 · Anthropic | Anthropic | 73.9 | 72.5 | 95 | -- | -- |
| 12 | Grok 4 · xAI | xAI | 72.8 | 70 | 95.5 | -- | -- |
| 13 | o4 Mini · OpenAI | OpenAI | 71.7 | 68.1 | 95 | -- | -- |
| 14 | GPT-5.5 · OpenAI | OpenAI | 71 | 88.7 | -- | -- | -- |
| 15 | GPT-5.5 Pro · OpenAI | OpenAI | 71 | 88.7 | -- | -- | -- |
| 16 | Claude Opus 4.7 · Anthropic | Anthropic | 70.1 | 87.6 | -- | -- | -- |
| 17 | GPT-4o-mini · OpenAI | OpenAI | 69.8 | -- | 87.2 | -- | -- |
| 18 | Claude Haiku 4.5 · Anthropic | Anthropic | 68.9 | 66.6 | 89.8 | -- | -- |
| 19 | Claude Sonnet 4 · Anthropic | Anthropic | 66.9 | 72.7 | 93.8 | 32.4 | -- |
| 20 | Gemini 2.5 Flash · Google | Google | 65.8 | 60.4 | 90 | -- | -- |
| 21 | Gemini 3.1 Pro Preview · Google | Google | 64.5 | 80.6 | -- | -- | -- |
| 22 | DeepSeek V4 Pro · DeepSeek | DeepSeek | 64.5 | 80.6 | -- | -- | -- |
| 23 | GPT-4 Turbo · OpenAI | OpenAI | 60.9 | -- | 87.1 | 48.2 | -- |
| 24 | Llama 3.3 70B Instruct · Meta | Meta | 60.9 | -- | 88.4 | 46.9 | -- |
| 25 | MiniMax M2.5 · MiniMax | MiniMax | 60.6 | 75.8 | -- | -- | -- |
| 26 | GPT-4 · OpenAI | OpenAI | 60.5 | -- | 88.4 | 46 | -- |
| 27 | Claude 3.5 Haiku · Anthropic | Anthropic | 60.4 | -- | 88.1 | 46.1 | -- |
| 28 | GPT-5.2 Chat(回退) · OpenAI | OpenAI | 60 | -- | -- | -- | 60 |
| 29 | GLM 5.1(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 30 | Grok 4.1 Fast(回退) · xAI | xAI | 60 | -- | -- | -- | 60 |
| 31 | MiMo-V2.5-Pro(回退) · Xiaomi | Xiaomi | 60 | -- | -- | -- | 60 |
| 32 | Kimi K2.6(回退) · Moonshot AI | Moonshot AI | 60 | -- | -- | -- | 60 |
| 33 | Qwen3.6 Max Preview(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 34 | GLM 5(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 35 | Grok 4.3(回退) · xAI | xAI | 60 | -- | -- | -- | 60 |
| 36 | Gemma 4 31B(回退) · Google | Google | 60 | -- | -- | -- | 60 |
| 37 | Claude Opus 4.1(回退) · Anthropic | Anthropic | 60 | -- | -- | -- | 60 |
| 38 | Qwen3.6 Plus(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 39 | MiMo-V2-Pro(回退) · Xiaomi | Xiaomi | 60 | -- | -- | -- | 60 |
| 40 | Qwen3.5 397B A17B(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 41 | GLM 4.7(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 42 | Gemma 4 26B A4B(回退) · Google | Google | 60 | -- | -- | -- | 60 |
| 43 | Gemini 3.1 Flash Lite Preview(回退) · Google | Google | 60 | -- | -- | -- | 60 |
| 44 | DeepSeek V4 Flash(回退) · DeepSeek | DeepSeek | 60 | -- | -- | -- | 60 |
| 45 | GPT-5 Chat(回退) · OpenAI | OpenAI | 60 | -- | -- | -- | 60 |
| 46 | GLM 4.6(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 47 | MiMo-V2.5(回退) · Xiaomi | Xiaomi | 60 | -- | -- | -- | 60 |
| 48 | DeepSeek V3.2(回退) · DeepSeek | DeepSeek | 60 | -- | -- | -- | 60 |
| 49 | DeepSeek V3.2 Exp(回退) · DeepSeek | DeepSeek | 60 | -- | -- | -- | 60 |
| 50 | Grok 4 Fast(回退) · xAI | xAI | 60 | -- | -- | -- | 60 |
| 51 | Qwen3.5-122B-A10B(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 52 | DeepSeek V3.1(回退) · DeepSeek | DeepSeek | 60 | -- | -- | -- | 60 |
| 53 | Hy3 preview(回退) · Tencent | Tencent | 60 | -- | -- | -- | 60 |
| 54 | DeepSeek V3.1 Terminus(回退) · DeepSeek | DeepSeek | 60 | -- | -- | -- | 60 |
| 55 | Qwen3 VL 235B A22B Instruct(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 56 | GLM 4.5(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 57 | MiniMax M2.7(回退) · MiniMax | MiniMax | 60 | -- | -- | -- | 60 |
| 58 | Qwen3.5-27B(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 59 | Qwen3 Next 80B A3B Instruct(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 60 | Qwen3.5-Flash(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 61 | Qwen3.5-35B-A3B(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 62 | Qwen3 VL 235B A22B Thinking(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 63 | Step 3.5 Flash(回退) · StepFun | StepFun | 60 | -- | -- | -- | 60 |
| 64 | GLM 4.6V(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 65 | Trinity Large Thinking(回退) · arcee-ai | arcee-ai | 60 | -- | -- | -- | 60 |
| 66 | Trinity Large Preview(回退) · arcee-ai | arcee-ai | 60 | -- | -- | -- | 60 |
| 67 | GLM 4.5 Air(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 68 | Qwen3 Next 80B A3B Thinking(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 69 | GLM 4.7 Flash(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 70 | MiniMax M1(回退) · MiniMax | MiniMax | 60 | -- | -- | -- | 60 |
| 71 | o3 Mini High(回退) · OpenAI | OpenAI | 60 | -- | -- | -- | 60 |
| 72 | Grok 3 Mini Beta(回退) · xAI | xAI | 60 | -- | -- | -- | 60 |
| 73 | Command A(回退) · Cohere | Cohere | 60 | -- | -- | -- | 60 |
| 74 | GLM 4.5V(回退) · Zhipu AI | Zhipu AI | 60 | -- | -- | -- | 60 |
| 75 | Qwen3 8B(回退) · Alibaba | Alibaba | 60 | -- | -- | -- | 60 |
| 76 | Mercury 2(回退) · Inception | Inception | 60 | -- | -- | -- | 60 |
| 77 | Llama 3.3 Nemotron Super 49B V1.5(回退) · NVIDIA | NVIDIA | 60 | -- | -- | -- | 60 |
| 78 | Nova 2 Lite(回退) · Amazon | Amazon | 60 | -- | -- | -- | 60 |
| 79 | gpt-oss-20b(回退) · OpenAI | OpenAI | 60 | -- | -- | -- | 60 |
| 80 | Mistral Large 2407(回退) · Mistral AI | Mistral AI | 60 | -- | -- | -- | 60 |
| 81 | Olmo 3 32B Think(回退) · Allen AI | Allen AI | 60 | -- | -- | -- | 60 |
| 82 | GPT-4.1 · OpenAI | OpenAI | 58.8 | 54.6 | 91.5 | 31.8 | -- |
| 83 | Phi 4 · Microsoft | Microsoft | 57.6 | -- | 82.6 | 45.5 | -- |
| 84 | Llama 3.1 70B Instruct · Meta | Meta | 57 | -- | 80.5 | 46.1 | -- |
| 85 | o1 · OpenAI | OpenAI | 57 | 48.9 | 92.4 | 32.4 | -- |
| 86 | DeepSeek V3 · DeepSeek | DeepSeek | 56.6 | 42 | 82.6 | 50 | -- |
| 87 | Gemma 2 27B · Google | Google | 55.6 | -- | 69.5 | -- | -- |
| 88 | Mistral Large · Mistral AI | Mistral AI | 54.9 | -- | 92 | 30 | -- |
| 89 | GPT-4o · OpenAI | OpenAI | 54.7 | 30.8 | 90.2 | 51.1 | -- |
| 90 | Llama 3 70B Instruct · Meta | Meta | 54.5 | -- | 77.4 | 43.6 | -- |
| 91 | Grok 3 · xAI | xAI | 52.9 | -- | 90.5 | 27 | -- |
| 92 | Claude 3 Haiku · Anthropic | Anthropic | 52.3 | -- | 76.8 | 39.4 | -- |
| 93 | DeepSeek V3 0324 · DeepSeek | DeepSeek | 50.5 | -- | 84.5 | 27.7 | -- |
| 94 | Llama 4 Maverick · Meta | Meta | 50.2 | 21 | 89.5 | 49.7 | -- |
| 95 | MiniMax M2 · MiniMax | MiniMax | 48.8 | 61 | -- | -- | -- |
| 96 | GPT-5 Mini · OpenAI | OpenAI | 47.8 | 59.8 | -- | -- | -- |
| 97 | R1 0528 · DeepSeek | DeepSeek | 46.1 | 57.6 | -- | -- | -- |
| 98 | Llama 3.1 8B Instruct · Meta | Meta | 46 | -- | 69.5 | 32.8 | -- |
| 99 | Gemini 2.0 Flash · Google | Google | 46 | 13.5 | 89.4 | 45.9 | -- |
| 100 | Gemini 2.5 Pro · Google | Google | 44.3 | 63.8 | -- | 29.7 | -- |
| 101 | Llama 3 8B Instruct · Meta | Meta | 42.1 | -- | 61.6 | 31.9 | -- |
| 102 | GPT-4o (2024-11-20) · OpenAI | OpenAI | 38.4 | -- | -- | 48 | -- |
| 103 | o3 Mini · OpenAI | OpenAI | 38.1 | 49.3 | -- | 33.1 | -- |
| 104 | GPT-4o-mini (2024-07-18) · OpenAI | OpenAI | 36.9 | -- | -- | 46.1 | -- |
| 105 | R1 · DeepSeek | DeepSeek | 36.8 | 49.2 | -- | 29.7 | -- |
| 106 | R1 Distill Qwen 32B · DeepSeek | DeepSeek | 35.1 | -- | -- | 43.9 | -- |
| 107 | GPT-4.1 Mini · OpenAI | OpenAI | 31.2 | 23.9 | -- | 48.9 | -- |
| 108 | Llama 4 Scout · Meta | Meta | 30.9 | 9.1 | 74.1 | 16.9 | -- |
| 109 | Qwen2.5 7B Instruct · Alibaba | Alibaba | 30.1 | -- | -- | 37.6 | -- |
| 110 | Command R (08-2024) · Cohere | Cohere | 29.7 | -- | -- | 37.1 | -- |
| 111 | R1 Distill Llama 70B · DeepSeek | DeepSeek | 28.2 | -- | -- | 35.3 | -- |
| 112 | GPT-5 Nano · OpenAI | OpenAI | 27.8 | 34.8 | -- | -- | -- |
| 113 | Maestro Reasoning · arcee-ai | arcee-ai | 23.8 | -- | -- | 29.7 | -- |
| 114 | GPT-4.1 Nano · OpenAI | OpenAI | 22.7 | -- | -- | 28.4 | -- |
| 115 | gpt-oss-120b · OpenAI | OpenAI | 20.8 | 26 | -- | -- | -- |
| 116 | Grok 3 Mini · xAI | xAI | 18.9 | -- | -- | 23.6 | -- |
| 117 | Llama 3.2 3B Instruct · Meta | Meta | 18.7 | -- | -- | 23.4 | -- |
| 118 | Gemini 2.0 Flash Lite · Google | Google | 15.7 | -- | -- | 19.6 | -- |
| 119 | Llama 3.2 1B Instruct · Meta | Meta | 6.6 | -- | -- | 8.2 | -- |