| 1 | google/gemini-3.1-pro-preview | | 33.3% | 3 | 6 | 9 |
| 2 | google/gemini-3-flash-preview | | 4.4% | 26 | 568 | 594 |
| 3 | qwen/qwen3-235b-a22b | | 3.2% | 7 | 214 | 221 |
| 4 | google/gemini-2.0-flash-001 | | 2.8% | 15 | 522 | 537 |
| 5 | openai/gpt-4o | | 1.2% | 7 | 587 | 594 |
| 6 | deepseek/deepseek-chat-v3-0324 | | 0.7% | 4 | 590 | 594 |
| 7 | anthropic/claude-3.7-sonnet | | 0.6% | 3 | 468 | 471 |
| 8 | mistralai/mistral-medium-3 | | 0% | 0 | 594 | 594 |
| 9 | meta-llama/llama-3.3-70b-instruct | | 0% | 0 | 594 | 594 |
| 10 | x-ai/grok-3-mini-beta | | 0% | 0 | 486 | 486 |