| 1 | google/gemini-3.1-pro-preview | | 33.3% | 3 | 6 | 9 |
| 2 | google/gemini-3-flash-preview | | 4.6% | 21 | 438 | 459 |
| 3 | qwen/qwen3-235b-a22b | | 3.2% | 7 | 214 | 221 |
| 4 | google/gemini-2.0-flash-001 | | 3.1% | 14 | 445 | 459 |
| 5 | openai/gpt-4o | | 1.3% | 6 | 453 | 459 |
| 6 | deepseek/deepseek-chat-v3-0324 | | 0.9% | 4 | 455 | 459 |
| 7 | anthropic/claude-3.7-sonnet | | 0.7% | 3 | 456 | 459 |
| 8 | mistralai/mistral-medium-3 | | 0% | 0 | 459 | 459 |
| 9 | meta-llama/llama-3.3-70b-instruct | | 0% | 0 | 459 | 459 |
| 10 | x-ai/grok-3-mini-beta | | 0% | 0 | 459 | 459 |