| 1 | google/gemini-3.1-pro-preview | | 95.2% | 20 | 1 | 21 |
| 2 | z-ai/glm-5 | | 87% | 127 | 19 | 146 |
| 3 | moonshotai/kimi-k2.5 | | 74% | 108 | 38 | 146 |
| 4 | x-ai/grok-3-mini-beta | | 56.2% | 82 | 64 | 146 |
| 5 | qwen/qwen3-235b-a22b | | 38.9% | 44 | 69 | 113 |
| 6 | minimax/minimax-m2.5 | | 32.9% | 48 | 98 | 146 |
| 7 | google/gemini-3-flash-preview | | 21.9% | 32 | 114 | 146 |
| 8 | anthropic/claude-sonnet-4.6 | | 13% | 19 | 127 | 146 |
| 9 | meta-llama/llama-3.3-70b-instruct | | 12.5% | 4 | 28 | 32 |
| 10 | google/gemini-2.0-flash-001 | | 6.2% | 9 | 137 | 146 |
| 11 | anthropic/claude-3.7-sonnet | | 6.2% | 9 | 137 | 146 |
| 12 | deepseek/deepseek-chat-v3-0324 | | 3.4% | 5 | 141 | 146 |
| 13 | openai/gpt-4o | | 3.4% | 5 | 141 | 146 |
| 14 | mistralai/mistral-medium-3 | | 0% | 0 | 146 | 146 |