 Google (AI Studio) |  Gemini 3.1 Pro Preview (AI Studio) | | | | | | | 29.42 | N/A | |
 Google (Vertex) |  Gemini 3.1 Pro Preview (Vertex) | | | | | | | 39.23 | N/A | |
 OpenAI |  GPT-5.4 (xhigh) | | | | | | | 109.26 | N/A | |
 OpenAI |  GPT-5.3 Codex (xhigh) | | | | | | | 92.20 | N/A | |
 Anthropic |  Claude Opus 4.6 (max) | | | | | | | 19.99 | N/A | |
 Microsoft Azure |  Claude Opus 4.6 (max) | | | | | | | 20.54 | N/A | |
 Google |  Claude Opus 4.6 (max) | | | | | | | 9.36 | N/A | |
 Amazon Bedrock |  Claude Opus 4.6 (max) | | | | | | | 10.12 | N/A | |
 Microsoft Azure |  Claude Sonnet 4.6 (max) | | | | | | | 63.69 | N/A | |
 Amazon Bedrock |  Claude Sonnet 4.6 (max) | | | | | | | 46.77 | N/A | |
 Anthropic |  Claude Sonnet 4.6 (max) | | | | | | | 75.73 | N/A | |
 Google |  Claude Sonnet 4.6 (max) | | | | | | | 73.07 | N/A | |
 OpenAI |  GPT-5.2 (xhigh) | | | | | | | 111.61 | N/A | |
 Microsoft Azure |  GPT-5.2 (xhigh) | | | | | | | 97.69 | N/A | |
 Databricks |  GPT-5.2 (xhigh) | | | | | | | 122.12 | N/A | |
 Novita FP8 |  GLM-5 FP8 | | | | | | | 55.81 | 43.65 | |
 FriendliAI |  GLM-5 | | | | | | | 49.15 | 38.92 | |
 SiliconFlow (FP8) |  GLM-5 (FP8) | | | | | | | 71.26 | 54.21 | |
 DeepInfra FP8 |  GLM-5 FP8 | | | | | | | 73.24 | 57.92 | |
 GMI FP8 |  GLM-5 FP8 | | | | | | | 23.54 | 17.62 | |
 Fireworks |  GLM-5 | | | | | | | 11.60 | 8.47 | |
 Parasail (FP8) |  GLM-5 (FP8) | | | | | | | 91.82 | 72.90 | |
 Weights & Biases (FP8) |  GLM-5 (FP8) | | | | | | | 83.28 | 66.01 | |
 Baseten |  GLM-5 | | | | | | | 13.05 | 10.17 | |
 Google |  GLM-5 | | | | | | | 27.50 | 21.50 | |
 Together.ai (FP4) |  GLM-5 (FP4) | | | | | | | 45.74 | 36.05 | |
 OpenAI |  GPT-5.2 Codex (xhigh) | | | | | | | 10.96 | N/A | |
 Microsoft Azure |  GPT-5.2 Codex (xhigh) | | | | | | | 14.56 | N/A | |
 Amazon Bedrock |  Kimi K2.5 | | | | | | | 34.61 | 26.64 | |
 Lightning AI |  Kimi K2.5 | | | | | | | 23.82 | 18.87 | |
 Fireworks |  Kimi K2.5 | | | | | | | 14.38 | 11.25 | |
 Novita |  Kimi K2.5 | | | | | | | 57.65 | 45.21 | |
 Kimi |  Kimi K2.5 | | | | | | | 60.53 | 47.54 | |
 DeepInfra |  Kimi K2.5 | | | | | | | 169.96 | 135.04 | |
 Together.ai |  Kimi K2.5 | | | | | | | 56.07 | 44.53 | |
 Parasail |  Kimi K2.5 | | | | | | | 70.10 | 55.63 | |
 SiliconFlow |  Kimi K2.5 | | | | | | | 113.71 | 89.44 | |
 Weights & Biases |  Kimi K2.5 | | | | | | | 45.36 | 35.76 | |
 DeepInfra Turbo |  Kimi K2.5 Turbo | | | | | | | 10.45 | 7.87 | |
 Baseten |  Kimi K2.5 | | | | | | | 8.73 | 6.81 | |
 Nebius |  Kimi K2.5 | | | | | | | 40.66 | 31.90 | |
 OpenAI |  GPT-5.2 (medium) | | | | | | | 10.80 | N/A | |
 Microsoft Azure |  Claude Opus 4.6 | | | | | | | 11.59 | N/A | |
 Amazon Bedrock |  Claude Opus 4.6 | | | | | | | 11.15 | N/A | |
 Anthropic |  Claude Opus 4.6 | | | | | | | 11.39 | N/A | |
 Google |  Claude Opus 4.6 | | | | | | | 10.67 | N/A | |
 Google (AI Studio) |  Gemini 3 Flash (AI Studio) | | | | | | | 9.52 | N/A | |
 Alibaba Cloud |  Qwen3.5 397B A17B | | | | | | | 45.84 | 35.22 | |
 Novita |  Qwen3.5 397B A17B | | | | | | | 44.16 | 34.45 | |
 Together.ai |  Qwen3.5 397B A17B | | | | | | | 311.97 | 86.91 | |
 Parasail |  Qwen3.5 397B A17B | | | | | | | 86.65 | 68.81 | |
 Google |  Claude Sonnet 4.6 | | | | | | | 10.49 | N/A | |
 Amazon Bedrock |  Claude Sonnet 4.6 | | | | | | | 10.33 | N/A | |
 Anthropic |  Claude Sonnet 4.6 | | | | | | | 10.80 | N/A | |
 Microsoft Azure |  Claude Sonnet 4.6 | | | | | | | 11.27 | N/A | |
 Anthropic |  Claude Sonnet 4.6 (Non-reasoning, Low Effort) | | | | | | | 10.81 | N/A | |
 Alibaba Cloud |  Qwen3.5 27B | | | | | | | 29.57 | 22.58 | |
 Novita |  Qwen3.5 27B | | | | | | | 34.64 | 26.59 | |
 FriendliAI |  MiniMax-M2.5 | | | | | | | 60.05 | 46.12 | |
 MiniMax |  MiniMax-M2.5 | | | | | | | 53.77 | 41.18 | |
 Novita |  MiniMax-M2.5 | | | | | | | 74.65 | 58.68 | |
 Fireworks |  MiniMax-M2.5 | | | | | | | 9.89 | 7.40 | |
 Clarifai |  MiniMax-M2.5 | | | | | | | 17.65 | 13.87 | |
 Weights & Biases |  MiniMax-M2.5 | | | | | | | 28.68 | 22.45 | |
 SambaNova |  MiniMax-M2.5 | | | | | | | 6.58 | 4.80 | |
 SiliconFlow (FP8) |  MiniMax-M2.5 (FP8) | | | | | | | 28.21 | 21.84 | |
 Together.ai (FP4) |  MiniMax-M2.5 (FP4) | | | | | | | 42.30 | 33.59 | |
 Parasail (FP8) |  MiniMax-M2.5 (FP8) | | | | | | | 33.33 | 26.27 | |
 Amazon Bedrock |  DeepSeek V3.2 | | | | | | | 46.26 | 35.89 | |
 SiliconFlow (FP8) |  DeepSeek V3.2 (FP8) | | | | | | | 105.45 | 83.38 | |
 DeepSeek |  DeepSeek V3.2 | | | | | | | 106.40 | 84.07 | |
 Google Vertex |  DeepSeek V3.2 Vertex | | | | | | | 80.82 | 64.11 | |
 Novita |  DeepSeek V3.2 | | | | | | | 77.08 | 60.49 | |
 Parasail (FP8) |  DeepSeek V3.2 (FP8) | | | | | | | 269.09 | 214.06 | |
 Fireworks |  DeepSeek V3.2 | | | | | | | 28.80 | 22.12 | |
 SambaNova |  DeepSeek V3.2 | | | | | | | 11.11 | 7.80 | |
 Nebius |  DeepSeek V3.2 | | | | | | | 33.58 | 26.03 | |
 Alibaba Cloud |  Qwen3.5 122B A10B | | | | | | | 20.16 | 15.32 | |
 Novita |  Qwen3.5 122B A10B | | | | | | | 21.26 | 16.19 | |
 xAI |  Grok 4 | | | | | | | 24.52 | N/A | |
 Microsoft Azure |  Grok 4 | | | | | | | 23.58 | N/A | |
 Xiaomi |  MiMo-V2-Flash (Feb 2026) | | | | | | | 23.27 | 17.50 | |
 Google (AI Studio) |  Gemini 3 Pro Preview (low) (AI Studio) | | | | | | | 6.67 | N/A | |
 Google (Vertex) |  Gemini 3 Pro Preview (low) (Vertex) | | | | | | | 8.17 | N/A | |
 Databricks |  GPT-5 mini (high) | | | | | | | 144.71 | N/A | |
 OpenAI |  GPT-5 mini (high) | | | | | | | 157.66 | N/A | |
 Microsoft Azure |  GPT-5 mini (high) | | | | | | | 107.42 | N/A | |
 Fireworks |  GLM-5 | | | | | | | 3.25 | N/A | |
 Baseten |  GLM-5 | | | | | | | 2.81 | N/A | |
 DeepInfra (FP8) |  GLM-5 (FP8) | | | | | | | 17.18 | N/A | |
 SiliconFlow (FP8) |  GLM-5 (FP8) | | | | | | | 16.50 | N/A | |
 Novita (FP8) |  GLM-5 (FP8) | | | | | | | 13.13 | N/A | |
 Alibaba Cloud |  Qwen3.5 397B A17B | | | | | | | 10.26 | N/A | |
 Novita |  Qwen3.5 397B A17B | | | | | | | 9.99 | N/A | |
 Alibaba Cloud |  Qwen3 Max Thinking | | | | | | | 74.42 | 58.26 | |
 OpenAI |  GPT-5.1 Codex mini (high) | | | | | | | 9.26 | N/A | |
 Microsoft Azure |  GPT-5.1 Codex mini (high) | | | | | | | 18.16 | N/A | |
 xAI |  Grok 4.1 Fast | | | | | | | 17.51 | N/A | |
 Microsoft Azure |  o3 | | | | | | | 33.84 | N/A | |
 OpenAI |  o3 | | | | | | | 19.23 | N/A | |
 StepFun |  Step 3.5 Flash | | | | | | | 16.71 | 12.44 | |
 SiliconFlow (FP8) |  Step 3.5 Flash (FP8) | | | | | | | 24.68 | 18.86 | |
 Nebius |  Kimi K2.5 | | | | | | | 9.84 | N/A | |
 Kimi |  Kimi K2.5 | | | | | | | 14.28 | N/A | |
 GMI |  Kimi K2.5 | | | | | | | 11.80 | N/A | |
 Together.ai |  Kimi K2.5 | | | | | | | 25.70 | N/A | |
 Fireworks |  Kimi K2.5 | | | | | | | 3.22 | N/A | |
 Novita |  Kimi K2.5 | | | | | | | 31.46 | N/A | |
 Baseten |  Kimi K2.5 | | | | | | | 3.65 | N/A | |
 Alibaba Cloud |  Qwen3.5 27B | | | | | | | 6.58 | N/A | |
 Alibaba Cloud |  Qwen3.5 35B A3B | | | | | | | 19.65 | 14.89 | |
 Novita |  Qwen3.5 35B A3B | | | | | | | 21.36 | 16.20 | |
 Parasail (FP8) |  Qwen3.5 35B A3B (FP8) | | | | | | | 29.75 | 23.46 | |
 Amazon Bedrock |  Claude 4.5 Haiku | | | | | | | 13.18 | N/A | |
 Google Vertex |  Claude 4.5 Haiku Vertex | | | | | | | 21.77 | N/A | |
 Anthropic |  Claude 4.5 Haiku | | | | | | | 15.82 | N/A | |
 Microsoft Azure |  Claude 4.5 Haiku | | | | | | | 16.16 | N/A | |
 Novita |  KAT-Coder-Pro V1 | | | | | | | 10.65 | N/A | |
 Alibaba Cloud |  Qwen3.5 122B A10B | | | | | | | 4.61 | N/A | |
 Amazon Bedrock |  Nova 2.0 Pro Preview (medium) | | | | | | | 35.19 | 14.40 | |
 Google (AI Studio) |  Gemini 3 Flash (AI Studio) | | | | | | | 3.88 | N/A | |
 Google Vertex |  Gemini 2.5 Pro Vertex | | | | | | | 30.43 | N/A | |
 Google (AI Studio) |  Gemini 2.5 Pro (AI Studio) | | | | | | | 28.11 | N/A | |
 OpenAI |  GPT-5.2 | | | | | | | 8.77 | N/A | |
 Microsoft Azure |  GPT-5.2 | | | | | | | 7.73 | N/A | |
 Google (AI Studio) |  Gemini 3.1 Flash-Lite Preview (AI Studio) | | | | | | | 7.70 | N/A | |
 Cerebras |  gpt-oss-120B (high) | | | | | | | 1.48 | 0.96 | |
 Parasail |  gpt-oss-120B (high) | | | | | | | 63.32 | 50.23 | |
 Databricks |  gpt-oss-120B (high) | | | | | | | 19.74 | 15.34 | |
 Cloudflare |  gpt-oss-120B (high) | | | | | | | 111.13 | 18.21 | |
 Microsoft Azure |  gpt-oss-120B (high) | | | | | | | 9.97 | 7.65 | |
 Baseten |  gpt-oss-120B (high) | | | | | | | 11.11 | 8.80 | |
 SambaNova |  gpt-oss-120B (high) | | | | | | | 4.02 | 2.62 | |
 Hyperbolic |  gpt-oss-120B (high) | | | | | | | 4.16 | 2.97 | |
 Amazon Bedrock |  gpt-oss-120B (high) | | | | | | | 8.60 | 6.37 | |
 Together.ai |  gpt-oss-120B (high) | | | | | | | 3.99 | 2.90 | |
 Lightning AI |  gpt-oss-120B (high) | | | | | | | 12.04 | 9.48 | |
 DeepInfra (Turbo) |  gpt-oss-120B (high) (Turbo) | | | | | | | 10.24 | 8.00 | |
 Google Vertex |  gpt-oss-120B (high) Vertex | | | | | | | 5.33 | 4.05 | |
 Snowflake |  gpt-oss-120B (high) | | | | | | | 9.63 | 7.36 | |
 Groq |  gpt-oss-120B (high) | | | | | | | 6.31 | 4.27 | |
 Clarifai |  gpt-oss-120B (high) | | | | | | | 6.14 | 4.73 | |
 DeepInfra |  gpt-oss-120B (high) | | | | | | | 35.91 | 28.26 | |
 Weights & Biases |  gpt-oss-120B (high) | | | | | | | 24.02 | 18.71 | |
 Novita |  gpt-oss-120B (high) | | | | | | | 30.49 | 23.81 | |
 Fireworks |  gpt-oss-120B (high) | | | | | | | 3.53 | 2.58 | |
 Scaleway |  gpt-oss-120B (high) | | | | | | | 19.52 | 15.09 | |
 Nebius Base |  gpt-oss-120B (high) Base | | | | | | | 12.33 | 9.42 | |
 Eigen AI |  gpt-oss-120B (high) | | | | | | | 5.29 | 3.16 | |
 Inception |  Mercury 2 | | | | | | | 4.71 | N/A | |
 Alibaba Cloud |  Qwen3 Max Thinking (Preview) | | | | | | | 63.43 | 49.39 | |
 Amazon Bedrock |  DeepSeek V3.2 | | | | | | | 8.39 | N/A | |
 GMI |  DeepSeek V3.2 | | | | | | | 17.32 | N/A | |
 SambaNova |  DeepSeek V3.2 | | | | | | | 3.95 | N/A | |
 SiliconFlow (FP8) |  DeepSeek V3.2 (FP8) | | | | | | | 17.70 | N/A | |
 DeepSeek |  DeepSeek V3.2 | | | | | | | 21.95 | N/A | |
 Google Vertex |  DeepSeek V3.2 Vertex | | | | | | | 14.32 | N/A | |
 Fireworks |  DeepSeek V3.2 | | | | | | | 11.87 | N/A | |
 Novita |  DeepSeek V3.2 | | | | | | | 16.48 | N/A | |
 DeepInfra |  DeepSeek V3.2 | | | | | | | 44.80 | N/A | |
 Microsoft Azure |  DeepSeek V3.2 | | | | | | | 7.54 | N/A | |
 Nebius |  DeepSeek V3.2 | | | | | | | 7.77 | N/A | |
 xAI Fast |  Grok 3 mini Reasoning (high) Fast | | | | | | | 13.09 | 10.11 | |
 xAI |  Grok 3 mini Reasoning (high) | | | | | | | 13.24 | 10.21 | |
 Microsoft Azure |  Grok 3 mini Reasoning (high) | | | | | | | 24.18 | 19.05 | |
 Amazon Bedrock |  Nova 2.0 Pro Preview (low) | | | | | | | 23.44 | 13.41 | |
 Alibaba Cloud |  Qwen3 Max | | | | | | | 17.34 | N/A | |
 Novita |  Qwen3 Max | | | | | | | 16.92 | N/A | |
 Amazon Bedrock |  Claude 4.5 Haiku | | | | | | | 5.87 | N/A | |
 Google Vertex |  Claude 4.5 Haiku Vertex | | | | | | | 5.56 | N/A | |
 Anthropic |  Claude 4.5 Haiku | | | | | | | 5.53 | N/A | |
 Microsoft Azure |  Claude 4.5 Haiku | | | | | | | 6.06 | N/A | |
 Alibaba Cloud |  Qwen3.5 35B A3B | | | | | | | 4.54 | N/A | |
 Xiaomi |  MiMo-V2-Flash | | | | | | | 5.82 | N/A | |
 Novita |  GLM-4.7-Flash | | | | | | | 29.34 | 22.84 | |
 DeepInfra |  GLM-4.7-Flash | | | | | | | 29.55 | 23.42 | |
 Amazon Bedrock |  GLM-4.7-Flash | | | | | | | 11.64 | 8.29 | |
 Amazon Bedrock |  Nova 2.0 Lite (medium) | | | | | | | 22.48 | 9.63 | |
 Novita |  Qwen3 235B A22B 2507 | | | | | | | 43.97 | 34.25 | |
 Alibaba Cloud |  Qwen3 235B A22B 2507 | | | | | | | 59.57 | 46.51 | |
 Weights & Biases |  Qwen3 235B A22B 2507 | | | | | | | 24.68 | 19.25 | |
 DeepInfra (FP8) |  Qwen3 235B A22B 2507 (FP8) | | | | | | | 86.18 | 68.66 | |
 Nebius (FP8) |  Qwen3 235B A22B 2507 (FP8) | | | | | | | 34.98 | 27.47 | |
 FriendliAI |  Qwen3 235B A22B 2507 | | | | | | | 55.23 | 43.95 | |
 Eigen AI (FP8) |  Qwen3 235B A22B 2507 (FP8) | | | | | | | 16.64 | 12.16 | |
 xAI |  Grok Code Fast 1 | | | | | | | 6.17 | N/A | |
 Together.ai (FP8) |  Qwen3 Coder Next (FP8) | | | | | | | 3.70 | N/A | |
 Novita (FP8) |  Qwen3 Coder Next (FP8) | | | | | | | 4.01 | N/A | |
 Parasail (FP8) |  Qwen3 Coder Next (FP8) | | | | | | | 5.76 | N/A | |
 Alibaba Cloud |  Qwen3 VL 235B A22B | | | | | | | 57.31 | 44.97 | |
 Novita |  Qwen3 VL 235B A22B | | | | | | | 62.98 | 49.46 | |
 Together.ai |  Apriel-v1.6-15B-Thinker | | | | | | | 18.60 | 14.71 | |
 Mistral |  Magistral Medium 1.2 | | | | | | | 62.52 | 49.62 | |
 Nebius |  DeepSeek R1 0528 | | | | | | | 79.36 | 62.96 | |
 Hyperbolic |  DeepSeek R1 0528 | | | | | | | 70.43 | 55.12 | |
 DeepInfra |  DeepSeek R1 0528 | | | | | | | 62.67 | 49.65 | |
 SambaNova |  DeepSeek R1 0528 | | | | | | | 10.61 | 7.55 | |
 Google Vertex |  DeepSeek R1 0528 Vertex | | | | | | | 12.73 | 9.96 | |
 Together.ai |  DeepSeek R1 0528 | | | | | | | 8.81 | 6.74 | |
 Nebius Fast, FP4 |  DeepSeek R1 0528 Fast, FP4 | | | | | | | 11.04 | 7.90 | |
 Novita |  DeepSeek R1 0528 | | | | | | | 60.98 | 47.80 | |
 Microsoft Azure |  DeepSeek R1 0528 | | | | | | | 32.09 | 25.28 | |
 Databricks |  GPT-5 nano (high) | | | | | | | 116.66 | N/A | |
 OpenAI |  GPT-5 nano (high) | | | | | | | 90.15 | N/A | |
 Microsoft Azure |  GPT-5 nano (high) | | | | | | | 112.04 | N/A | |
 Google Vertex |  Qwen3 Next 80B A3B Vertex | | | | | | | 15.33 | 12.04 | |
 Novita |  Qwen3 Next 80B A3B | | | | | | | 12.99 | 9.63 | |
 Alibaba Cloud |  Qwen3 Next 80B A3B | | | | | | | 20.29 | 15.36 | |
 Hyperbolic |  Qwen3 Next 80B A3B | | | | | | | 8.44 | 6.26 | |
 Nebius (FP8) |  Qwen3 Next 80B A3B (FP8) | | | | | | | 17.53 | 13.49 | |
 Eigen AI |  Qwen3 Next 80B A3B | | | | | | | 9.07 | 6.06 | |
 Parasail |  Qwen3 235B 2507 | | | | | | | 16.65 | N/A | |
 Scaleway |  Qwen3 235B 2507 | | | | | | | 7.09 | N/A | |
 Nebius |  Qwen3 235B 2507 | | | | | | | 5.92 | N/A | |
 Alibaba Cloud |  Qwen3 235B 2507 | | | | | | | 8.88 | N/A | |
 Together.ai (FP8) |  Qwen3 235B 2507 (FP8) | | | | | | | 2.35 | N/A | |
 Weights & Biases |  Qwen3 235B 2507 | | | | | | | 11.36 | N/A | |
 Hyperbolic |  Qwen3 235B 2507 | | | | | | | 13.15 | N/A | |
 Amazon Bedrock |  Qwen3 235B 2507 | | | | | | | 7.61 | N/A | |
 DeepInfra |  Qwen3 235B 2507 | | | | | | | 56.45 | N/A | |
 Google Vertex |  Qwen3 235B 2507 Vertex | | | | | | | 5.06 | N/A | |
 Novita |  Qwen3 235B 2507 | | | | | | | 20.89 | N/A | |
 FriendliAI |  Qwen3 235B 2507 | | | | | | | 9.51 | N/A | |
 DeepInfra (FP8) |  Qwen3 Coder 480B (FP8) | | | | | | | 5.68 | N/A | |
 Hyperbolic (FP8) |  Qwen3 Coder 480B (FP8) | | | | | | | 7.43 | N/A | |
 Together.ai (FP8) |  Qwen3 Coder 480B (FP8) | | | | | | | 3.35 | N/A | |
 Alibaba Cloud |  Qwen3 Coder 480B | | | | | | | 9.22 | N/A | |
 Nebius |  Qwen3 Coder 480B | | | | | | | 7.52 | N/A | |
 Amazon Bedrock |  Qwen3 Coder 480B | | | | | | | 6.97 | N/A | |
 Google Vertex |  Qwen3 Coder 480B Vertex | | | | | | | 3.01 | N/A | |
 DeepInfra (Turbo, FP4) |  Qwen3 Coder 480B (Turbo, FP4) | | | | | | | 7.43 | N/A | |
 Novita |  Qwen3 Coder 480B | | | | | | | 9.98 | N/A | |
 Weights & Biases |  Qwen3 Coder 480B | | | | | | | 7.79 | N/A | |
 Eigen AI |  Qwen3 Coder 480B | | | | | | | 6.18 | N/A | |
 Alibaba Cloud |  Qwen3 VL 32B | | | | | | | 27.68 | 21.14 | |
 Amazon Bedrock |  Nova 2.0 Lite (low) | | | | | | | 15.52 | 9.27 | |
 Novita |  gpt-oss-20B (high) | | | | | | | 23.97 | 18.62 | |
 Google Vertex |  gpt-oss-20B (high) Vertex | | | | | | | 9.00 | 7.06 | |
 Amazon Bedrock |  gpt-oss-20B (high) | | | | | | | 17.57 | 3.32 | |
 Databricks |  gpt-oss-20B (high) | | | | | | | 8.83 | 6.77 | |
 Groq |  gpt-oss-20B (high) | | | | | | | 3.02 | 2.24 | |
 DeepInfra |  gpt-oss-20B (high) | | | | | | | 26.32 | 20.60 | |
 Together.ai |  gpt-oss-20B (high) | | | | | | | 2.68 | 1.91 | |
 Cloudflare |  gpt-oss-20B (high) | | | | | | | 76.22 | 14.11 | |
 Hyperbolic |  gpt-oss-20B (high) | | | | | | | 21.40 | 16.65 | |
 Lightning AI |  gpt-oss-20B (high) | | | | | | | 6.40 | 4.83 | |
 Weights & Biases |  gpt-oss-20B (high) | | | | | | | 8.66 | 6.48 | |
 Nebius Base |  gpt-oss-20B (high) Base | | | | | | | 19.92 | 15.49 | |
 Baseten |  gpt-oss-120B (low) | | | | | | | 11.18 | 8.78 | |
 Lightning AI |  gpt-oss-120B (low) | | | | | | | 12.10 | 9.52 | |
 Amazon Bedrock |  gpt-oss-120B (low) | | | | | | | 8.76 | 6.52 | |
 Parasail |  gpt-oss-120B (low) | | | | | | | 67.92 | 53.84 | |
 Databricks |  gpt-oss-120B (low) | | | | | | | 19.35 | 15.02 | |
 Together.ai |  gpt-oss-120B (low) | | | | | | | 4.08 | 2.86 | |
 Hyperbolic |  gpt-oss-120B (low) | | | | | | | 4.19 | 3.00 | |
 Fireworks |  gpt-oss-120B (low) | | | | | | | 3.65 | 2.68 | |
 Groq |  gpt-oss-120B (low) | | | | | | | 6.36 | 4.30 | |
 Weights & Biases |  gpt-oss-120B (low) | | | | | | | 24.52 | 19.07 | |
 Cerebras |  gpt-oss-120B (low) | | | | | | | 1.81 | 1.06 | |
 Clarifai |  gpt-oss-120B (low) | | | | | | | 8.17 | 6.32 | |
 SambaNova |  gpt-oss-120B (low) | | | | | | | 3.79 | 2.52 | |
 Nebius Base |  gpt-oss-120B (low) Base | | | | | | | 11.23 | 8.53 | |
 Snowflake |  gpt-oss-120B (low) | | | | | | | 9.66 | 7.33 | |
 Google Vertex |  gpt-oss-120B (low) Vertex | | | | | | | 5.58 | 4.25 | |
 Cloudflare |  gpt-oss-120B (low) | | | | | | | 34.09 | 17.51 | |
 Microsoft Azure |  gpt-oss-120B (low) | | | | | | | 11.23 | 8.63 | |
 Eigen AI |  gpt-oss-120B (low) | | | | | | | 5.26 | 3.05 | |
 Novita |  gpt-oss-120B (low) | | | | | | | 41.54 | 32.71 | |
 Nebius |  NVIDIA Nemotron 3 Nano | | | | | | | 12.89 | 9.85 | |
 DeepInfra |  NVIDIA Nemotron 3 Nano | | | | | | | 24.76 | 19.42 | |
 xAI |  Grok 4.1 Fast | | | | | | | 5.50 | N/A | |
 SiliconFlow |  GLM-4.6V | | | | | | | 167.44 | 132.46 | |
 DeepInfra (FP8) |  GLM-4.6V (FP8) | | | | | | | 23.93 | 18.95 | |
 Parasail (FP8) |  GLM-4.6V (FP8) | | | | | | | 23.85 | 18.70 | |
 Novita |  GLM-4.6V | | | | | | | 113.39 | 89.77 | |
 Amazon Bedrock |  Nova 2.0 Omni (low) | | | | | | | 13.62 | 8.75 | |
 Amazon Bedrock |  Nova 2.0 Pro Preview | | | | | | | 3.69 | N/A | |
 Amazon Bedrock |  Mistral Large 3 | | | | | | | 4.41 | N/A | |
 Mistral |  Mistral Large 3 | | | | | | | 9.72 | N/A | |
 Microsoft Azure |  Mistral Large 3 | | | | | | | 5.46 | N/A | |
 Nebius |  Qwen3 30B A3B 2507 | | | | | | | 33.36 | 26.23 | |
 Alibaba Cloud |  Qwen3 30B A3B 2507 | | | | | | | 18.63 | 14.13 | |
 Clarifai |  Qwen3 30B A3B 2507 | | | | | | | 41.35 | 32.86 | |
 Amazon Bedrock |  GLM-4.7-Flash | | | | | | | 3.29 | N/A | |
 Novita |  GLM-4.7-Flash | | | | | | | 6.62 | N/A | |
 Mistral |  Devstral 2 | | | | | | | 6.49 | N/A | |
 Google (AI Studio) |  Gemini 2.5 Flash-Lite (Sep) (AI Studio) | | | | | | | 8.64 | N/A | |
 Mistral |  Mistral Medium 3.1 | | | | | | | 5.36 | N/A | |
 Google Vertex |  gpt-oss-20B (low) Vertex | | | | | | | 9.00 | 7.07 | |
 Amazon Bedrock |  gpt-oss-20B (low) | | | | | | | 11.78 | 6.59 | |
 Novita |  gpt-oss-20B (low) | | | | | | | 23.03 | 17.84 | |
 Together.ai |  gpt-oss-20B (low) | | | | | | | 2.87 | 2.06 | |
 Databricks |  gpt-oss-20B (low) | | | | | | | 8.69 | 6.66 | |
 Groq |  gpt-oss-20B (low) | | | | | | | 3.69 | 2.21 | |
 Nebius Base |  gpt-oss-20B (low) Base | | | | | | | 22.68 | 17.65 | |
 Cloudflare |  gpt-oss-20B (low) | | | | | | | 32.45 | 17.98 | |
 Lightning AI |  gpt-oss-20B (low) | | | | | | | 6.38 | 4.81 | |
 Hyperbolic |  gpt-oss-20B (low) | | | | | | | 21.27 | 16.59 | |
 Weights & Biases |  gpt-oss-20B (low) | | | | | | | 8.58 | 6.44 | |
 DeepInfra (FP8) |  Qwen3 VL 235B A22B (FP8) | | | | | | | 51.74 | N/A | |
 Novita |  Qwen3 VL 235B A22B | | | | | | | 18.23 | N/A | |
 Alibaba Cloud |  Qwen3 VL 235B A22B | | | | | | | 10.04 | N/A | |
 Parasail (FP8) |  Qwen3 VL 235B A22B (FP8) | | | | | | | 32.67 | N/A | |
 Eigen AI |  Qwen3 VL 235B A22B | | | | | | | 7.36 | N/A | |
 Hyperbolic |  Qwen3 Next 80B A3B | | | | | | | 2.19 | N/A | |
 Novita |  Qwen3 Next 80B A3B | | | | | | | 5.43 | N/A | |
 Parasail |  Qwen3 Next 80B A3B | | | | | | | 4.89 | N/A | |
 Alibaba Cloud |  Qwen3 Next 80B A3B | | | | | | | 4.67 | N/A | |
 Google Vertex |  Qwen3 Next 80B A3B Vertex | | | | | | | 2.38 | N/A | |
 DeepInfra |  Qwen3 Next 80B A3B | | | | | | | 3.23 | N/A | |
 GMI |  Qwen3 Next 80B A3B | | | | | | | 3.70 | N/A | |
 Nebius |  Qwen3 Coder 30B A3B | | | | | | | 6.62 | N/A | |
 Alibaba Cloud |  Qwen3 Coder 30B A3B | | | | | | | 21.20 | N/A | |
 Scaleway |  Qwen3 Coder 30B A3B | | | | | | | 6.32 | N/A | |
 Amazon Bedrock |  Qwen3 Coder 30B A3B | | | | | | | 3.90 | N/A | |
 Clarifai |  Qwen3 Coder 30B A3B | | | | | | | 2.98 | N/A | |
 Alibaba Cloud |  Qwen3 VL 30B A3B | | | | | | | 27.17 | 20.95 | |
 Fireworks |  Qwen3 VL 30B A3B | | | | | | | 14.18 | 11.12 | |
 Novita |  Qwen3 VL 30B A3B | | | | | | | 28.94 | 22.31 | |
 Mistral |  Devstral Small 2 | | | | | | | 2.76 | N/A | |
 Google (AI Studio) |  Gemini 2.5 Flash-Lite (Sep) (AI Studio) | | | | | | | 1.80 | N/A | |
 Amazon Bedrock |  Nova Premier | | | | | | | 8.94 | N/A | |
 DeepInfra |  Llama Nemotron Super 49B v1.5 | | | | | | | 30.22 | 23.99 | |
 Nebius (FP8) |  Hermes 4 405B (FP8) | | | | | | | 75.90 | 60.07 | |
 Parasail (FP8) |  Llama 4 Maverick (FP8) | | | | | | | 4.24 | N/A | |
 Google Vertex |  Llama 4 Maverick Vertex | | | | | | | 3.42 | N/A | |
 DeepInfra (Turbo, FP8) |  Llama 4 Maverick (Turbo, FP8) | | | | | | | 9.44 | N/A | |
 Together.ai |  Llama 4 Maverick | | | | | | | 6.76 | N/A | |
 Microsoft Azure (FP8) |  Llama 4 Maverick (FP8) | | | | | | | 3.03 | N/A | |
 Amazon Bedrock |  Llama 4 Maverick | | | | | | | 3.03 | N/A | |
 Databricks |  Llama 4 Maverick | | | | | | | 5.48 | N/A | |
 DeepInfra (FP8) |  Llama 4 Maverick (FP8) | | | | | | | 9.51 | N/A | |
 SambaNova |  Llama 4 Maverick | | | | | | | 1.53 | N/A | |
 Groq |  Llama 4 Maverick | | | | | | | 2.02 | N/A | |
 Snowflake |  Llama 4 Maverick | | | | | | | 4.45 | N/A | |
 Novita (FP8) |  Llama 4 Maverick (FP8) | | | | | | | 6.57 | N/A | |
 Mistral |  Magistral Small 1.2 | | | | | | | 14.62 | 11.43 | |
 Amazon Bedrock |  Magistral Small 1.2 | | | | | | | 32.68 | 25.25 | |
 Amazon Bedrock |  Nova 2.0 Lite | | | | | | | 3.40 | N/A | |
 Nebius (FP8) |  Hermes 4 405B (FP8) | | | | | | | 16.19 | N/A | |
 Amazon Bedrock Latency Optimized |  Llama 3.1 405B Latency Optimized | | | | | | | 6.87 | N/A | |
 Amazon Bedrock Standard |  Llama 3.1 405B Standard | | | | | | | 20.03 | N/A | |
 Replicate |  Llama 3.1 405B | | | | | | | 17.97 | N/A | |
 Google Vertex |  Llama 3.1 405B Vertex | | | | | | | 18.30 | N/A | |
 Databricks |  Llama 3.1 405B | | | | | | | 12.52 | N/A | |
 Microsoft Azure |  Llama 3.1 405B | | | | | | | 17.07 | N/A | |
 Alibaba Cloud |  Qwen3 VL 32B | | | | | | | 7.74 | N/A | |
 SiliconFlow |  GLM-4.6V | | | | | | | 62.81 | N/A | |
 Parasail (FP8) |  GLM-4.6V (FP8) | | | | | | | 5.00 | N/A | |
 Novita |  GLM-4.6V | | | | | | | 18.85 | N/A | |
 Alibaba Cloud |  Qwen3 VL 8B | | | | | | | 19.95 | 15.14 | |
 Amazon Bedrock |  Nova 2.0 Omni | | | | | | | 2.98 | N/A | |
 Fireworks |  Qwen3 VL 30B A3B | | | | | | | 3.10 | N/A | |
 Novita |  Qwen3 VL 30B A3B | | | | | | | 4.77 | N/A | |
 DeepInfra (FP8) |  Qwen3 VL 30B A3B (FP8) | | | | | | | 10.43 | N/A | |
 Alibaba Cloud |  Qwen3 VL 30B A3B | | | | | | | 5.08 | N/A | |
 Nebius (FP8) |  Hermes 4 70B (FP8) | | | | | | | 31.81 | 25.00 | |
 Mistral |  Ministral 3 14B | | | | | | | 3.88 | N/A | |
 Amazon Bedrock |  Ministral 3 14B | | | | | | | 3.19 | N/A | |
 SiliconFlow |  Ling-flash-2.0 | | | | | | | 8.82 | N/A | |
 Alibaba Cloud |  Qwen3 Omni 30B A3B | | | | | | | 25.54 | 19.70 | |
 DeepInfra (FP8) |  Mistral Small 3.2 (FP8) | | | | | | | 4.11 | N/A | |
 Mistral |  Mistral Small 3.2 | | | | | | | 3.00 | N/A | |
 Nebius Base |  Llama Nemotron Ultra Base | | | | | | | 60.10 | 47.54 | |
 Nebius |  Qwen3 30B A3B 2507 | | | | | | | 6.51 | N/A | |
 Alibaba Cloud |  Qwen3 30B A3B 2507 | | | | | | | 7.61 | N/A | |
 Clarifai |  Qwen3 30B A3B 2507 | | | | | | | 9.11 | N/A | |
 Novita |  ERNIE 4.5 300B A47B | | | | | | | 20.95 | N/A | |
 DeepInfra (FP8) |  NVIDIA Nemotron Nano 12B v2 VL (FP8) | | | | | | | 19.20 | 15.01 | |
 Mistral |  Ministral 3 8B | | | | | | | 2.89 | N/A | |
 Amazon Bedrock |  Ministral 3 8B | | | | | | | 3.78 | N/A | |
 DeepInfra |  NVIDIA Nemotron Nano 9B V2 | | | | | | | 24.69 | 19.37 | |
 DeepInfra |  Llama Nemotron Super 49B v1.5 | | | | | | | 6.30 | N/A | |
 SambaNova |  Llama 3.3 70B | | | | | | | 2.04 | N/A | |
 Parasail (FP8) |  Llama 3.3 70B (FP8) | | | | | | | 13.36 | N/A | |
 Amazon Bedrock |  Llama 3.3 70B | | | | | | | 4.23 | N/A | |
 Groq |  Llama 3.3 70B | | | | | | | 1.92 | N/A | |
 Nebius Fast |  Llama 3.3 70B Fast | | | | | | | 5.24 | N/A | |
 Nebius Base |  Llama 3.3 70B Base | | | | | | | 37.90 | N/A | |
 Snowflake Snowflake |  Llama 3.3 70B Snowflake | | | | | | | 4.10 | N/A | |
 Fireworks |  Llama 3.3 70B | | | | | | | 3.72 | N/A | |
 FriendliAI |  Llama 3.3 70B | | | | | | | 5.40 | N/A | |
 Hyperbolic |  Llama 3.3 70B | | | | | | | 6.46 | N/A | |
 Google Vertex |  Llama 3.3 70B Vertex | | | | | | | 3.20 | N/A | |
 Weights & Biases |  Llama 3.3 70B | | | | | | | 5.82 | N/A | |
 Cloudflare |  Llama 3.3 70B | | | | | | | 16.15 | N/A | |
 CompactifAI |  Llama 3.3 70B | | | | | | | 4.00 | N/A | |
 Databricks |  Llama 3.3 70B | | | | | | | 7.50 | N/A | |
 Together.ai Turbo |  Llama 3.3 70B Turbo | | | | | | | 6.19 | N/A | |
 Lightning AI |  Llama 3.3 70B | | | | | | | 8.28 | N/A | |
 Microsoft Azure |  Llama 3.3 70B | | | | | | | 4.76 | N/A | |
 Scaleway |  Llama 3.3 70B | | | | | | | 6.64 | N/A | |
 DeepInfra (Turbo, FP8) |  Llama 3.3 70B (Turbo, FP8) | | | | | | | 20.45 | N/A | |
 Novita |  Llama 3.3 70B | | | | | | | 12.89 | N/A | |
 Eigen AI |  Llama 3.3 70B | | | | | | | 2.82 | N/A | |
 Alibaba Cloud |  Qwen3 VL 8B | | | | | | | 4.54 | N/A | |
 Together.ai |  Qwen3 VL 8B | | | | | | | 5.78 | N/A | |
 SiliconFlow |  Ring-flash-2.0 | | | | | | | 33.77 | 25.81 | |
 Parasail |  Olmo 3.1 32B Think | | | | | | | 31.76 | 25.01 | |
 Eigen AI |  Llama 4 Scout | | | | | | | 3.31 | N/A | |
 Google Vertex |  Llama 4 Scout Vertex | | | | | | | 2.90 | N/A | |
 Microsoft Azure |  Llama 4 Scout | | | | | | | 8.02 | N/A | |
 CompactifAI |  Llama 4 Scout | | | | | | | 5.26 | N/A | |
 Amazon Bedrock |  Llama 4 Scout | | | | | | | 2.93 | N/A | |
 Weights & Biases |  Llama 4 Scout | | | | | | | 4.40 | N/A | |
 Cloudflare |  Llama 4 Scout | | | | | | | 5.56 | N/A | |
 Groq |  Llama 4 Scout | | | | | | | 1.95 | N/A | |
 DeepInfra |  Llama 4 Scout | | | | | | | 7.31 | N/A | |
 Novita |  Llama 4 Scout | | | | | | | 6.22 | N/A | |
 Microsoft Azure |  Command A | | | | | | | 12.40 | N/A | |
 Cohere |  Command A | | | | | | | 13.76 | N/A | |
 DeepInfra |  Llama 3.1 Nemotron 70B | | | | | | | 14.43 | N/A | |
 DeepInfra |  NVIDIA Nemotron 3 Nano | | | | | | | 4.58 | N/A | |
 Nebius (FP8) |  Hermes 4 70B (FP8) | | | | | | | 6.42 | N/A | |
 DeepInfra |  Olmo 3.1 32B Instruct | | | | | | | 9.66 | N/A | |
 Mistral |  Ministral 3 3B | | | | | | | 2.09 | N/A | |
 Amazon Bedrock |  Ministral 3 3B | | | | | | | 1.79 | N/A | |
 AI21 Labs |  Jamba 1.7 Large | | | | | | | 9.96 | N/A | |
 Replicate |  Granite 4.0 H Small | | | | | | | 10.11 | N/A | |
 Alibaba Cloud |  Qwen3 Omni 30B A3B | | | | | | | 5.61 | N/A | |
 Together.ai |  LFM2 24B A2B | | | | | | | 2.31 | N/A | |
 DeepInfra |  Phi-4 | | | | | | | 11.97 | N/A | |
 Microsoft Azure |  Phi-4 | | | | | | | 71.25 | N/A | |
 Google (AI Studio) |  Gemma 3 27B (AI Studio) | | | | | | | 14.75 | N/A | |
 Novita |  Gemma 3 27B | | | | | | | 12.82 | N/A | |
 Parasail |  Gemma 3 27B | | | | | | | 13.79 | N/A | |
 DeepInfra |  Gemma 3 27B | | | | | | | 14.53 | N/A | |
 Amazon Bedrock |  Gemma 3 27B | | | | | | | 6.27 | N/A | |
 Nebius (FP8) |  Gemma 3 27B (FP8) | | | | | | | 9.32 | N/A | |
 Amazon Bedrock |  Nova Micro | | | | | | | 2.27 | N/A | |
 Amazon Bedrock |  NVIDIA Nemotron Nano 12B v2 VL | | | | | | | 3.79 | N/A | |
 Nebius |  NVIDIA Nemotron Nano 12B v2 VL | | | | | | | 4.26 | N/A | |
 DeepInfra (FP8) |  NVIDIA Nemotron Nano 12B v2 VL (FP8) | | | | | | | 4.26 | N/A | |
 Reka AI |  Reka Flash 3 | | | | | | | 46.92 | 36.47 | |
 Parasail |  Olmo 3 7B Think | | | | | | | 43.31 | 34.31 | |
 SiliconFlow |  Ling-mini-2.0 | | | | | | | 4.77 | N/A | |
 Google (AI Studio) |  Gemma 3 12B (AI Studio) | | | | | | | 47.76 | N/A | |
 DeepInfra |  Gemma 3 12B | | | | | | | 13.52 | N/A | |
 Databricks |  Gemma 3 12B | | | | | | | 5.47 | N/A | |
 Amazon Bedrock |  Gemma 3 12B | | | | | | | 5.28 | N/A | |
 Cloudflare |  Gemma 3 12B | | | | | | | 6.88 | N/A | |
 Microsoft Azure |  Llama 3.2 11B (Vision) | | | | | | | 7.17 | N/A | |
 DeepInfra |  Llama 3.2 11B (Vision) | | | | | | | 114.00 | N/A | |
 Amazon Bedrock |  Llama 3.2 11B (Vision) | | | | | | | 3.13 | N/A | |
 Parasail |  Olmo 3 7B | | | | | | | 10.98 | N/A | |
 Alibaba Cloud |  Qwen3 1.7B | | | | | | | 19.04 | 14.54 | |
 Alibaba Cloud |  Qwen3 1.7B | | | | | | | 4.52 | N/A | |
 Alibaba Cloud |  Qwen3 0.6B | | | | | | | 12.07 | 8.96 | |
 Together.ai |  Gemma 3n E4B | | | | | | | 10.15 | N/A | |
 Google (AI Studio) |  Gemma 3 4B (AI Studio) | | | | | | | 14.80 | N/A | |
 Amazon Bedrock |  Gemma 3 4B | | | | | | | 2.69 | N/A | |
 DeepInfra |  Gemma 3 4B | | | | | | | 13.32 | N/A | |
 Alibaba Cloud |  Qwen3 0.6B | | | | | | | 3.18 | N/A | |
 Google (AI Studio) |  Gemma 3 1B (AI Studio) | | | | | | | 11.12 | N/A | |
 Google (AI Studio) |  Gemma 3n E2B (AI Studio) | | | | | | | 10.75 | N/A | |
 Amazon Bedrock |  Llama 3.2 90B (Vision) | | | | | | | 8.67 | N/A | |
 Microsoft Azure |  Llama 3.2 90B (Vision) | | | | | | | 12.48 | N/A | |
 DeepInfra |  Llama 3.2 90B (Vision) | | | | | | | 9.06 | N/A | |
 SambaNova |  DeepSeek R1 Distill Llama 70B | | | | | | | 10.01 | 7.23 | |
 DeepInfra |  DeepSeek R1 Distill Llama 70B | | | | | | | 41.47 | 32.96 | |
 Scaleway |  DeepSeek R1 Distill Llama 70B | | | | | | | 64.42 | 50.86 | |
 Microsoft Azure |  Phi-4 Mini | | | | | | | 11.75 | N/A | |
 Weights & Biases |  Phi-4 Mini | | | | | | | 2.44 | N/A | |
 Microsoft Azure |  Phi-4 Multimodal | | | | | | | 30.41 | N/A | |
 DeepInfra |  NVIDIA Nemotron Nano 9B V2 | | | | | | | 5.38 | N/A | |
 Amazon Bedrock |  NVIDIA Nemotron Nano 9B V2 | | | | | | | 4.25 | N/A | |
 Parasail |  Molmo2-8B | | | | | | | 4.25 | N/A | |
 Together.ai |  Cogito v2.1 | | | | | | | 31.64 | 25.03 | |