{
  "schemaVersion": "1.0",
  "name": "BenchLM curated comparisons",
  "description": "Curated and high-value model comparisons. BenchLM supports more pairwise comparison pages than this export includes.",
  "canonicalUrl": "https://benchlm.ai/data/comparisons.json",
  "generatedAt": "2026-06-12T20:35:11.146Z",
  "sourceLastUpdated": "June 12, 2026",
  "sourceFiles": [
    "src/data/featuredComparisons.js",
    "src/lib/prebuiltComparisons.js"
  ],
  "counts": {
    "exportedComparisons": 400,
    "totalPairwiseComparisons": 33153
  },
  "items": [
    {
      "slug": "claude-opus-4-8-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gpt-5-5.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 4,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 41,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 81.5,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 58.6,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 70.4,
          "winner": "A",
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 85,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 51.7,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-claude-opus-4-8",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-claude-opus-4-8",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-claude-opus-4-8.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 9,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 41,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 74.9,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 72.9,
          "winner": "A",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 68.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 4,
      "comparableCategoryCount": 5,
      "benchmarkCountA": 40,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 81.5,
          "winner": "B",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": 58.6,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": 70.4,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": 85,
          "winner": "B",
          "benchmarkCount": 7
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 51.7,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "scoreDiff": 63,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 40,
      "benchmarkCountB": 21,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 5,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 40,
      "benchmarkCountB": 38,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": 82.8,
          "winner": "A",
          "benchmarkCount": 11
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": 77.1,
          "winner": "B",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 66,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 42,
      "benchmarkCountB": 21,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 5,
      "winsA": 4,
      "winsB": 2,
      "comparableCategoryCount": 6,
      "benchmarkCountA": 42,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 74.9,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 72.9,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": 75.8,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 68.2,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": 43.8,
          "winner": "A",
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 8,
      "winsA": 0,
      "winsB": 4,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 42,
      "benchmarkCountB": 19,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 85.2,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 85.6,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 92.4,
          "winner": "B",
          "benchmarkCount": 9
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 74.8,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 10,
      "winsA": 0,
      "winsB": 4,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 42,
      "benchmarkCountB": 19,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 87,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 85.9,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 92.7,
          "winner": "B",
          "benchmarkCount": 9
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 74.6,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 2,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 42,
      "benchmarkCountB": 38,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 82.8,
          "winner": "B",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": 77.1,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-1-flash-lite-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/gemini-3-1-flash-lite-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-flash-lite-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "gemini-3-1-flash-lite",
        "canonicalModelKey": "gemini-3-1-flash-lite",
        "model": "Gemini 3.1 Flash-Lite",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 47,
        "rankingEligible": true,
        "overallRank": 75,
        "url": "https://benchlm.ai/models/gemini-3-1-flash-lite",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-flash-lite.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 42,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 42,
      "benchmarkCountB": 21,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 73.2,
          "winner": "B",
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-1-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 7,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 42,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 60.9,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gpt-5-5-vs-kimi-k2-7-code",
      "url": "https://benchlm.ai/compare/gpt-5-5-vs-kimi-k2-7-code",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-vs-kimi-k2-7-code.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "kimi-k2-7-code",
        "canonicalModelKey": "kimi-k2-7-code",
        "model": "Kimi K2.7 Code",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 0,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/kimi-k2-7-code",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-7-code.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 89,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 42,
      "benchmarkCountB": 6,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 77,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 21,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 90.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 57.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 52.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "modelB": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 68,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 38,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 82.8,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 77.1,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "glm-5-reasoning-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/glm-5-reasoning-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-reasoning-vs-gpt-5-5.md",
      "modelA": {
        "slug": "glm-5-reasoning",
        "canonicalModelKey": "glm-5-reasoning",
        "model": "GLM-5 (Reasoning)",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 79,
        "rankingEligible": true,
        "overallRank": 24,
        "url": "https://benchlm.ai/models/glm-5-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-reasoning.md"
      },
      "modelB": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 10,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 81.5,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 58.6,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 70.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 85,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 66.4,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 51.7,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-1-vs-kimi-k2-7-code",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-kimi-k2-7-code",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-kimi-k2-7-code.md",
      "modelA": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "modelB": {
        "slug": "kimi-k2-7-code",
        "canonicalModelKey": "kimi-k2-7-code",
        "model": "Kimi K2.7 Code",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 0,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/kimi-k2-7-code",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-7-code.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "scoreDiff": 82,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 33,
      "benchmarkCountB": 6,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 65.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 52.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "kimi-k2-7-code-vs-ling-2-6-flash",
      "url": "https://benchlm.ai/compare/kimi-k2-7-code-vs-ling-2-6-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/kimi-k2-7-code-vs-ling-2-6-flash.md",
      "modelA": {
        "slug": "ling-2-6-flash",
        "canonicalModelKey": "ling-2-6-flash",
        "model": "Ling 2.6 Flash",
        "creator": "InclusionAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 36,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/ling-2-6-flash",
        "markdownUrl": "https://benchlm.ai/md/models/ling-2-6-flash.md"
      },
      "modelB": {
        "slug": "kimi-k2-7-code",
        "canonicalModelKey": "kimi-k2-7-code",
        "model": "Kimi K2.7 Code",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 0,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/kimi-k2-7-code",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-7-code.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "ling-2-6-flash",
        "canonicalModelKey": "ling-2-6-flash",
        "model": "Ling 2.6 Flash",
        "creator": "InclusionAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 36,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/ling-2-6-flash",
        "markdownUrl": "https://benchlm.ai/md/models/ling-2-6-flash.md"
      },
      "scoreDiff": 36,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 6,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 27,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 59,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 57,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-vs-ling-2-6-flash",
      "url": "https://benchlm.ai/compare/gpt-5-5-vs-ling-2-6-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-vs-ling-2-6-flash.md",
      "modelA": {
        "slug": "ling-2-6-flash",
        "canonicalModelKey": "ling-2-6-flash",
        "model": "Ling 2.6 Flash",
        "creator": "InclusionAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 36,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/ling-2-6-flash",
        "markdownUrl": "https://benchlm.ai/md/models/ling-2-6-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 53,
      "winsA": 0,
      "winsB": 2,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 19,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 81.5,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 27,
          "avgB": 58.6,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 70.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 85,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 59,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 57,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 51.7,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-1-vs-ling-2-6-flash",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-ling-2-6-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-ling-2-6-flash.md",
      "modelA": {
        "slug": "ling-2-6-flash",
        "canonicalModelKey": "ling-2-6-flash",
        "model": "Ling 2.6 Flash",
        "creator": "InclusionAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 36,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/ling-2-6-flash",
        "markdownUrl": "https://benchlm.ai/md/models/ling-2-6-flash.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "scoreDiff": 46,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 19,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 65.3,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 27,
          "avgB": 60.9,
          "winner": "B",
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 59,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 57,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-ling-2-6-flash",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-ling-2-6-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-ling-2-6-flash.md",
      "modelA": {
        "slug": "ling-2-6-flash",
        "canonicalModelKey": "ling-2-6-flash",
        "model": "Ling 2.6 Flash",
        "creator": "InclusionAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 36,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/ling-2-6-flash",
        "markdownUrl": "https://benchlm.ai/md/models/ling-2-6-flash.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "ling-2-6-flash",
        "canonicalModelKey": "ling-2-6-flash",
        "model": "Ling 2.6 Flash",
        "creator": "InclusionAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 36,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/ling-2-6-flash",
        "markdownUrl": "https://benchlm.ai/md/models/ling-2-6-flash.md"
      },
      "scoreDiff": 13,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 21,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 27,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 59,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 57,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "qwen3-6-27b-vs-qwen3-6-35b-a3b",
      "url": "https://benchlm.ai/compare/qwen3-6-27b-vs-qwen3-6-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/qwen3-6-27b-vs-qwen3-6-35b-a3b.md",
      "modelA": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "modelB": {
        "slug": "qwen3-6-35b-a3b",
        "canonicalModelKey": "qwen3-6-35b-a3b",
        "model": "Qwen3.6-35B-A3B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 65,
        "rankingEligible": true,
        "overallRank": 45,
        "url": "https://benchlm.ai/models/qwen3-6-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-35b-a3b.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "scoreDiff": 7,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 55,
      "benchmarkCountB": 58,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 59.3,
          "avgB": 51.5,
          "winner": "A",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.6,
          "avgB": 66.9,
          "winner": "A",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.6,
          "avgB": 76.1,
          "winner": "A",
          "benchmarkCount": 20
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.2,
          "avgB": 60.5,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "qwen3-5-27b-vs-qwen3-6-27b",
      "url": "https://benchlm.ai/compare/qwen3-5-27b-vs-qwen3-6-27b",
      "markdownUrl": "https://benchlm.ai/md/compare/qwen3-5-27b-vs-qwen3-6-27b.md",
      "modelA": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "modelB": {
        "slug": "qwen3-5-27b",
        "canonicalModelKey": "qwen3-5-27b",
        "model": "Qwen3.5-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 61,
        "rankingEligible": true,
        "overallRank": 52,
        "url": "https://benchlm.ai/models/qwen3-5-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-27b.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "scoreDiff": 11,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 55,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 59.3,
          "avgB": 51.6,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.6,
          "avgB": 63,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 18
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 60.6,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.2,
          "avgB": 80.6,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 95,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 82.2,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gemma-4-31b-vs-qwen3-6-27b",
      "url": "https://benchlm.ai/compare/gemma-4-31b-vs-qwen3-6-27b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemma-4-31b-vs-qwen3-6-27b.md",
      "modelA": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "modelB": {
        "slug": "gemma-4-31b",
        "canonicalModelKey": "gemma-4-31b",
        "model": "Gemma 4 31B",
        "creator": "Google",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 64,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gemma-4-31b",
        "markdownUrl": "https://benchlm.ai/md/models/gemma-4-31b.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "scoreDiff": 8,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 55,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 59.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.6,
          "avgB": 41.6,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.6,
          "avgB": 76.9,
          "winner": "B",
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.2,
          "avgB": 61.3,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 1,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-claude-opus-4-7",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-claude-opus-4-7",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-claude-opus-4-7.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 76,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 21,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-claude-opus-4-8",
      "url": "https://benchlm.ai/compare/claude-fable-vs-claude-opus-4-8",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-claude-opus-4-8.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 4,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 41,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 80.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 76.4,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 76.1,
          "winner": "A",
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 70.1,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-3-5-sonnet-vs-grok-4",
      "url": "https://benchlm.ai/compare/claude-3-5-sonnet-vs-grok-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-3-5-sonnet-vs-grok-4.md",
      "modelA": {
        "slug": "claude-3-5-sonnet",
        "canonicalModelKey": "claude-3-5-sonnet",
        "model": "Claude 3.5 Sonnet",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 40,
        "rankingEligible": true,
        "overallRank": 84,
        "url": "https://benchlm.ai/models/claude-3-5-sonnet",
        "markdownUrl": "https://benchlm.ai/md/models/claude-3-5-sonnet.md"
      },
      "modelB": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "scoreDiff": 23,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 19,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 49,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 59.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-4o-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gpt-4o-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4o-vs-grok-4-1.md",
      "modelA": {
        "slug": "gpt-4o",
        "canonicalModelKey": "gpt-4o",
        "model": "GPT-4o",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 42,
        "rankingEligible": true,
        "overallRank": 81,
        "url": "https://benchlm.ai/models/gpt-4o",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 47,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-2-5-pro-vs-o3",
      "url": "https://benchlm.ai/compare/gemini-2-5-pro-vs-o3",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-2-5-pro-vs-o3.md",
      "modelA": {
        "slug": "gemini-2-5-pro",
        "canonicalModelKey": "gemini-2-5-pro",
        "model": "Gemini 2.5 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 49,
        "url": "https://benchlm.ai/models/gemini-2-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-2-5-pro.md"
      },
      "modelB": {
        "slug": "o3",
        "canonicalModelKey": "o3",
        "model": "o3",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 56,
        "rankingEligible": true,
        "overallRank": 61,
        "url": "https://benchlm.ai/models/o3",
        "markdownUrl": "https://benchlm.ai/md/models/o3.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-2-5-pro",
        "canonicalModelKey": "gemini-2-5-pro",
        "model": "Gemini 2.5 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 49,
        "url": "https://benchlm.ai/models/gemini-2-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-2-5-pro.md"
      },
      "scoreDiff": 7,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 23,
      "benchmarkCountB": 18,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 40.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "kimi-2-6-vs-kimi-k2-7-code",
      "url": "https://benchlm.ai/compare/kimi-2-6-vs-kimi-k2-7-code",
      "markdownUrl": "https://benchlm.ai/md/compare/kimi-2-6-vs-kimi-k2-7-code.md",
      "modelA": {
        "slug": "kimi-k2-7-code",
        "canonicalModelKey": "kimi-k2-7-code",
        "model": "Kimi K2.7 Code",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 0,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/kimi-k2-7-code",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-7-code.md"
      },
      "modelB": {
        "slug": "kimi-2-6",
        "canonicalModelKey": "kimi-2-6",
        "model": "Kimi K2.6",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 81,
        "rankingEligible": true,
        "overallRank": 21,
        "url": "https://benchlm.ai/models/kimi-2-6",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-2-6.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "kimi-2-6",
        "canonicalModelKey": "kimi-2-6",
        "model": "Kimi K2.6",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 81,
        "rankingEligible": true,
        "overallRank": 21,
        "url": "https://benchlm.ai/models/kimi-2-6",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-2-6.md"
      },
      "scoreDiff": 81,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 6,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 73.1,
          "winner": null,
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 72,
          "winner": null,
          "benchmarkCount": 15
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 79.7,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 53.8,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-grok-4-20-beta",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-grok-4-20-beta",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-grok-4-20-beta.md",
      "modelA": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "modelB": {
        "slug": "grok-4-20-beta",
        "canonicalModelKey": "grok-4-20-beta",
        "model": "Grok 4.20",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 71,
        "rankingEligible": true,
        "overallRank": 35,
        "url": "https://benchlm.ai/models/grok-4-20-beta",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-20-beta.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "grok-4-20-beta",
        "canonicalModelKey": "grok-4-20-beta",
        "model": "Grok 4.20",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 71,
        "rankingEligible": true,
        "overallRank": 35,
        "url": "https://benchlm.ai/models/grok-4-20-beta",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-20-beta.md"
      },
      "scoreDiff": 48,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 18,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 47.1,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 61,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 70.8,
          "winner": null,
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 53.3,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-4o-vs-grok-4",
      "url": "https://benchlm.ai/compare/gpt-4o-vs-grok-4",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4o-vs-grok-4.md",
      "modelA": {
        "slug": "gpt-4o",
        "canonicalModelKey": "gpt-4o",
        "model": "GPT-4o",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 42,
        "rankingEligible": true,
        "overallRank": 81,
        "url": "https://benchlm.ai/models/gpt-4o",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o.md"
      },
      "modelB": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "scoreDiff": 21,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 19,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-4-1-opus-thinking-vs-grok-4",
      "url": "https://benchlm.ai/compare/claude-4-1-opus-thinking-vs-grok-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-1-opus-thinking-vs-grok-4.md",
      "modelA": {
        "slug": "claude-4-1-opus-thinking",
        "canonicalModelKey": "claude-4-1-opus-thinking",
        "model": "Claude 4.1 Opus Thinking",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 43,
        "rankingEligible": true,
        "overallRank": 80,
        "url": "https://benchlm.ai/models/claude-4-1-opus-thinking",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-1-opus-thinking.md"
      },
      "modelB": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "scoreDiff": 20,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 11,
      "benchmarkCountB": 19,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-grok-4-1-fast",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-grok-4-1-fast",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-grok-4-1-fast.md",
      "modelA": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "modelB": {
        "slug": "grok-4-1-fast",
        "canonicalModelKey": "grok-4-1-fast",
        "model": "Grok 4.1 Fast",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 41,
        "url": "https://benchlm.ai/models/grok-4-1-fast",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1-fast.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "grok-4-1-fast",
        "canonicalModelKey": "grok-4-1-fast",
        "model": "Grok 4.1 Fast",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 41,
        "url": "https://benchlm.ai/models/grok-4-1-fast",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1-fast.md"
      },
      "scoreDiff": 45,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 18,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-grok-3-beta",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-grok-3-beta",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-grok-3-beta.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "grok-3-beta",
        "canonicalModelKey": "grok-3-beta",
        "model": "Grok 3 [Beta]",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 30,
        "rankingEligible": true,
        "overallRank": 97,
        "url": "https://benchlm.ai/models/grok-3-beta",
        "markdownUrl": "https://benchlm.ai/md/models/grok-3-beta.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 61,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 38,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-4-sonnet-vs-grok-4",
      "url": "https://benchlm.ai/compare/claude-4-sonnet-vs-grok-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-sonnet-vs-grok-4.md",
      "modelA": {
        "slug": "claude-4-sonnet",
        "canonicalModelKey": "claude-4-sonnet",
        "model": "Claude 4 Sonnet",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 50,
        "rankingEligible": true,
        "overallRank": 70,
        "url": "https://benchlm.ai/models/claude-4-sonnet",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-sonnet.md"
      },
      "modelB": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "scoreDiff": 13,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 20,
      "benchmarkCountB": 19,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-vs-gpt-4o",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-vs-gpt-4o",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-vs-gpt-4o.md",
      "modelA": {
        "slug": "claude-opus-4-7",
        "canonicalModelKey": "claude-opus-4-7",
        "model": "Claude Opus 4.7",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 23,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/claude-opus-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7.md"
      },
      "modelB": {
        "slug": "gpt-4o",
        "canonicalModelKey": "gpt-4o",
        "model": "GPT-4o",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 42,
        "rankingEligible": true,
        "overallRank": 81,
        "url": "https://benchlm.ai/models/gpt-4o",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-4o",
        "canonicalModelKey": "gpt-4o",
        "model": "GPT-4o",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 42,
        "rankingEligible": true,
        "overallRank": 81,
        "url": "https://benchlm.ai/models/gpt-4o",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o.md"
      },
      "scoreDiff": 19,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 17,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-fable-vs-claude-mythos-5",
      "url": "https://benchlm.ai/compare/claude-fable-vs-claude-mythos-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-claude-mythos-5.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 2,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 19,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 85.2,
          "winner": "A",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 85.6,
          "winner": "A",
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 92.4,
          "winner": "A",
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 74.8,
          "winner": "B",
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-claude-opus-4-8",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-claude-opus-4-8",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-claude-opus-4-8.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 6,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 41,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 80.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 76.4,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 76.1,
          "winner": "A",
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 70.1,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 8,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 19,
      "benchmarkCountB": 38,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 82.8,
          "winner": "A",
          "benchmarkCount": 13
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 77.1,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 8,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 51,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 69.7,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 73.6,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 90.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 71.2,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 87,
          "winner": null,
          "benchmarkCount": 6
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 9,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 10,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 89.3,
          "winner": "B",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 94,
          "winner": "B",
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 83.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 49,
          "winner": "A",
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 50,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 10,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 45.1,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-grok-4-1.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 10,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gpt-5-4.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 11,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 77,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 57.7,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 72.7,
          "winner": "A",
          "benchmarkCount": 15
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 11,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 71.7,
          "winner": "A",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 71.1,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 81.1,
          "winner": "A",
          "benchmarkCount": 19
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 91.7,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 67.9,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 6
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-claude-opus-4-6",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-claude-opus-4-6",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-claude-opus-4-6.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 13,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 72.6,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 64.4,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 77.3,
          "winner": "A",
          "benchmarkCount": 11
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 13,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 77.2,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 54.5,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 83.8,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 74.7,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 58,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-deepseek-v4-pro-max",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-deepseek-v4-pro-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-deepseek-v4-pro-max.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 13,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 74,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 75.9,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 14,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 19,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 63.1,
          "winner": "A",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-claude-opus-4-7-adaptive",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-claude-opus-4-7-adaptive",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-claude-opus-4-7-adaptive.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 15,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 74.9,
          "winner": "A",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 72.9,
          "winner": "A",
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 68.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-glm-5-1.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 17,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-claude-sonnet-4-6",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-claude-sonnet-4-6",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-claude-sonnet-4-6.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "scoreDiff": 17,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": 77.4,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": 73.7,
          "winner": "A",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 6,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 19,
      "benchmarkCountB": 38,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 82.8,
          "winner": "A",
          "benchmarkCount": 13
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 77.1,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/claude-fable-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 6,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 51,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 69.7,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 73.6,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 90.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 71.2,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 87,
          "winner": null,
          "benchmarkCount": 6
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-fable-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 7,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 10,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 89.3,
          "winner": "B",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 94,
          "winner": "B",
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 83.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 49,
          "winner": "A",
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 50,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-fable-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 8,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 45.1,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/claude-fable-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-grok-4-1.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 8,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gpt-5-4.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 9,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 77,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 57.7,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 72.7,
          "winner": "A",
          "benchmarkCount": 15
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/claude-fable-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 9,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 71.7,
          "winner": "A",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 71.1,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 81.1,
          "winner": "A",
          "benchmarkCount": 19
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 91.7,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 67.9,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 6
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-fable-vs-claude-opus-4-6",
      "url": "https://benchlm.ai/compare/claude-fable-vs-claude-opus-4-6",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-claude-opus-4-6.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 11,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 72.6,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 64.4,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 77.3,
          "winner": "A",
          "benchmarkCount": 11
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-fable-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 11,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 77.2,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 54.5,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 83.8,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 74.7,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 58,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-deepseek-v4-pro-max",
      "url": "https://benchlm.ai/compare/claude-fable-vs-deepseek-v4-pro-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-deepseek-v4-pro-max.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 11,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 74,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 75.9,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-fable-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 12,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 19,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 63.1,
          "winner": "A",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-claude-opus-4-7-adaptive",
      "url": "https://benchlm.ai/compare/claude-fable-vs-claude-opus-4-7-adaptive",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-claude-opus-4-7-adaptive.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 13,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 74.9,
          "winner": "A",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 72.9,
          "winner": "A",
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 68.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-fable-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/claude-fable-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-glm-5-1.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 15,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 19,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-fable-vs-claude-sonnet-4-6",
      "url": "https://benchlm.ai/compare/claude-fable-vs-claude-sonnet-4-6",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-claude-sonnet-4-6.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "scoreDiff": 15,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 19,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": 77.4,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 73.7,
          "winner": "A",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 2,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 41,
      "benchmarkCountB": 38,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 82.8,
          "winner": "B",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 77.1,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 41,
      "benchmarkCountB": 51,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 69.7,
          "winner": "A",
          "benchmarkCount": 18
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 73.6,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 90.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 71.2,
          "winner": "B",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 87,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 41,
      "benchmarkCountB": 10,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 89.3,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 94,
          "winner": "B",
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 83.3,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 49,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 50,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 4,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 41,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 45.1,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-grok-4-1.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 4,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 41,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gpt-5-4.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 5,
      "winsA": 4,
      "winsB": 0,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 41,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 77,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 57.7,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 72.7,
          "winner": "A",
          "benchmarkCount": 13
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 5,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 41,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 71.7,
          "winner": "A",
          "benchmarkCount": 20
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 71.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 81.1,
          "winner": "B",
          "benchmarkCount": 19
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 91.7,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 67.9,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-claude-opus-4-8",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-claude-opus-4-8",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-claude-opus-4-8.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 7,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 41,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 72.6,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 64.4,
          "winner": "A",
          "benchmarkCount": 14
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 77.3,
          "winner": "B",
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 7,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 41,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 77.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 54.5,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 83.8,
          "winner": "B",
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 74.7,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 58,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-deepseek-v4-pro-max",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-deepseek-v4-pro-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-deepseek-v4-pro-max.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 7,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 41,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 74,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 75.9,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 8,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 41,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 63.1,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-glm-5-1.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 11,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 41,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-claude-sonnet-4-6",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-claude-sonnet-4-6",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-claude-sonnet-4-6.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "scoreDiff": 11,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 41,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": 77.4,
          "winner": "B",
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 38,
      "benchmarkCountB": 51,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 69.7,
          "winner": null,
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 73.6,
          "winner": null,
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": 90.4,
          "winner": "B",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 71.2,
          "winner": null,
          "benchmarkCount": 16
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 87,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 1,
      "winsA": 0,
      "winsB": 2,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 38,
      "benchmarkCountB": 10,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 89.3,
          "winner": null,
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": 94,
          "winner": "B",
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": 83.3,
          "winner": "B",
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 49,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 50,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 2,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 38,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": 45.1,
          "winner": "A",
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-grok-4-1.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 2,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 38,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 38,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 77,
          "winner": null,
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 57.7,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": 72.7,
          "winner": "A",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 66.1,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 38,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 71.7,
          "winner": null,
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 71.1,
          "winner": null,
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": 81.1,
          "winner": "A",
          "benchmarkCount": 19
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": 91.7,
          "winner": "B",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 67.9,
          "winner": null,
          "benchmarkCount": 16
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 5,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 38,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 72.6,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 64.4,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": 77.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 76.2,
          "winner": null,
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 5,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 38,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 74,
          "winner": null,
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 75.9,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 66.1,
          "winner": null,
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 6,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 38,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 71.5,
          "winner": null,
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 63.1,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 7,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 38,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 74.9,
          "winner": null,
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 72.9,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": 75.8,
          "winner": "A",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 68.2,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-glm-5-1.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 9,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 38,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 65.3,
          "winner": null,
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 60.9,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 52.3,
          "winner": null,
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gemini-3-1-pro",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gemini-3-1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gemini-3-1-pro.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "scoreDiff": 9,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 38,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 65.1,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 66.4,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": 77.4,
          "winner": "A",
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 73.7,
          "winner": null,
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-4-pro-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gpt-5-4-pro-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-pro-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 1,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 51,
      "benchmarkCountB": 10,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 89.3,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 94,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": 83.3,
          "winner": "A",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 49,
          "winner": "A",
          "benchmarkCount": 16
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 50,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gpt-5-5-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gpt-5-5-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 2,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 51,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 81.5,
          "winner": "B",
          "benchmarkCount": 18
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 58.6,
          "winner": "A",
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 70.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": 85,
          "winner": "A",
          "benchmarkCount": 6
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 51.7,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 2,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 51,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": 45.1,
          "winner": "A",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "grok-4-1-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/grok-4-1-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-4-1-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 2,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 51,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "gpt-5-4-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gpt-5-4-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 3,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 51,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 77,
          "winner": "B",
          "benchmarkCount": 19
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 57.7,
          "winner": "A",
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 72.7,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 16
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "qwen3-7-max-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/qwen3-7-max-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/qwen3-7-max-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 3,
      "winsA": 3,
      "winsB": 3,
      "comparableCategoryCount": 6,
      "benchmarkCountA": 51,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 71.7,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 71.1,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 81.1,
          "winner": null,
          "benchmarkCount": 17
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": 91.7,
          "winner": "B",
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 67.9,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": 89.2,
          "winner": "B",
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": 85.4,
          "winner": "A",
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 5,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 51,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 72.6,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 64.4,
          "winner": "A",
          "benchmarkCount": 15
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.3,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 17
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 5,
      "winsA": 4,
      "winsB": 1,
      "comparableCategoryCount": 5,
      "benchmarkCountA": 51,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 77.2,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 54.5,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 83.8,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": 74.7,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 58,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": 76.3,
          "winner": "A",
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 5,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 51,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 74,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 75.9,
          "winner": "B",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 6,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 51,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 71.5,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 63.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 7,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 51,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 74.9,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 72.9,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 64.3,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": 75.8,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 68.2,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "glm-5-1-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 9,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 51,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "scoreDiff": 9,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 51,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 14
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "gpt-5-4-pro-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/gpt-5-4-pro-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-pro-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 1,
      "winsA": 2,
      "winsB": 3,
      "comparableCategoryCount": 5,
      "benchmarkCountA": 10,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 81.5,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 58.6,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": 70.4,
          "winner": "A",
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": 85,
          "winner": "B",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": 51.7,
          "winner": "B",
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 1,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 10,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": 45.1,
          "winner": "A",
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gpt-5-4-pro-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gpt-5-4-pro-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-pro-vs-grok-4-1.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 1,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 10,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gpt-5-4-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/gpt-5-4-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 10,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 77,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 57.7,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": 72.7,
          "winner": "A",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 66.1,
          "winner": "B",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gpt-5-4-pro-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gpt-5-4-pro-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-pro-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 10,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 71.7,
          "winner": "A",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 71.1,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": 81.1,
          "winner": "A",
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": 91.7,
          "winner": "B",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 67.9,
          "winner": "B",
          "benchmarkCount": 16
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 4,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 10,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 72.6,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 64.4,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": 77.3,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 17
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 4,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 10,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 77.2,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 54.5,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": 83.8,
          "winner": "A",
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": 74.7,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 58,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 4,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 10,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 74,
          "winner": "A",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 75.9,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 66.1,
          "winner": "B",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 5,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 10,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 63.1,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 6,
      "winsA": 4,
      "winsB": 1,
      "comparableCategoryCount": 5,
      "benchmarkCountA": 10,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 74.9,
          "winner": "A",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 72.9,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": 75.8,
          "winner": "A",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 68.2,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": 43.8,
          "winner": "A",
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "glm-5-1-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 8,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 10,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 60.9,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 52.3,
          "winner": "B",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gpt-5-4-pro",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gpt-5-4-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gpt-5-4-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "scoreDiff": 8,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 10,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 66.4,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": 77.4,
          "winner": "A",
          "benchmarkCount": 4
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 42,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": 45.1,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-5-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gpt-5-5-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-vs-grok-4-1.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 42,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-4-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/gpt-5-4-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 1,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 42,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 77,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 57.7,
          "winner": "A",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 72.7,
          "winner": "B",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-5-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gpt-5-5-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 1,
      "winsA": 1,
      "winsB": 4,
      "comparableCategoryCount": 5,
      "benchmarkCountA": 42,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 71.7,
          "winner": "A",
          "benchmarkCount": 19
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 71.1,
          "winner": "B",
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 81.1,
          "winner": "B",
          "benchmarkCount": 19
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": 91.7,
          "winner": "B",
          "benchmarkCount": 6
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 67.9,
          "winner": "B",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 3,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 42,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 72.6,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 64.4,
          "winner": "B",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 77.3,
          "winner": "B",
          "benchmarkCount": 9
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 3,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 42,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 74,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 75.9,
          "winner": "B",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 4,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 42,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 63.1,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gpt-5-5",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gpt-5-5",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gpt-5-5.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "scoreDiff": 7,
      "winsA": 1,
      "winsB": 3,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 42,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": 77.4,
          "winner": "B",
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-grok-4-1.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 0,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 1,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 77,
          "winner": null,
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 57.7,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 72.7,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 66.1,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 1,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 4,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 71.7,
          "winner": null,
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 71.1,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 81.1,
          "winner": null,
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": 91.7,
          "winner": "B",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 67.9,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 3,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 72.6,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 64.4,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.3,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 76.2,
          "winner": null,
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 3,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 4,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 77.2,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 54.5,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 83.8,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": 74.7,
          "winner": "B",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 58,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 3,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 74,
          "winner": null,
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 75.9,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 66.1,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 4,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 71.5,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 63.1,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 5,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 4,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 74.9,
          "winner": null,
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 72.9,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 64.3,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": 75.8,
          "winner": "B",
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 68.2,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-glm-5-1.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 7,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 65.3,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 60.9,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 52.3,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gemini-3-pro-deep-think",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gemini-3-pro-deep-think",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gemini-3-pro-deep-think.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "scoreDiff": 7,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 65.1,
          "winner": null,
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 66.4,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 73.7,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-4-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gpt-5-4-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 1,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 48,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 77,
          "winner": null,
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 57.7,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 72.7,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 66.1,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "grok-4-1-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/grok-4-1-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-4-1-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 1,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 71.7,
          "winner": null,
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 71.1,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 81.1,
          "winner": null,
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 91.7,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 67.9,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 3,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 72.6,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 64.4,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.3,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 76.2,
          "winner": null,
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 3,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 77.2,
          "winner": null,
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 54.5,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 83.8,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 74.7,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 58,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 3,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 74,
          "winner": null,
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 75.9,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 66.1,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 4,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 71.5,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 63.1,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 5,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 74.9,
          "winner": null,
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 72.9,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 64.3,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 68.2,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-1-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 7,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 65.3,
          "winner": null,
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 60.9,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 52.3,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "scoreDiff": 7,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 65.1,
          "winner": null,
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": 66.4,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 73.7,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-4-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gpt-5-4-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 1,
      "winsB": 3,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 48,
      "benchmarkCountB": 68,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 71.7,
          "winner": "A",
          "benchmarkCount": 20
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 71.1,
          "winner": "B",
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": 81.1,
          "winner": "B",
          "benchmarkCount": 21
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 91.7,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 67.9,
          "winner": "B",
          "benchmarkCount": 16
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 89.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": 85.4,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "scoreDiff": 2,
      "winsA": 1,
      "winsB": 3,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 48,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 72.6,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 64.4,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": 77.3,
          "winner": "B",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 48,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 77.2,
          "winner": "B",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 54.5,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": 83.8,
          "winner": "B",
          "benchmarkCount": 13
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 74.7,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 58,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "scoreDiff": 2,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 48,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 74,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 75.9,
          "winner": "B",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 66.1,
          "winner": "tie",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 48,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 63.1,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "scoreDiff": 4,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 48,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 74.9,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 72.9,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 13
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 68.2,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-1-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "scoreDiff": 6,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 48,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 60.9,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gpt-5-4",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gpt-5-4",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gpt-5-4.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "scoreDiff": 6,
      "winsA": 1,
      "winsB": 3,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 48,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": 77.4,
          "winner": "B",
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 68,
      "benchmarkCountB": 47,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 72.6,
          "winner": "B",
          "benchmarkCount": 19
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": 64.4,
          "winner": "A",
          "benchmarkCount": 15
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": 77.3,
          "winner": "A",
          "benchmarkCount": 18
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": 76.2,
          "winner": "B",
          "benchmarkCount": 17
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "scoreDiff": 2,
      "winsA": 4,
      "winsB": 2,
      "comparableCategoryCount": 6,
      "benchmarkCountA": 68,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 77.2,
          "winner": "B",
          "benchmarkCount": 18
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": 54.5,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": 83.8,
          "winner": "B",
          "benchmarkCount": 18
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": 74.7,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": 58,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": 76.3,
          "winner": "A",
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "scoreDiff": 2,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 68,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 74,
          "winner": "B",
          "benchmarkCount": 18
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": 75.9,
          "winner": "B",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 17
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "scoreDiff": 3,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 68,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": 63.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 17
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "scoreDiff": 4,
      "winsA": 2,
      "winsB": 3,
      "comparableCategoryCount": 5,
      "benchmarkCountA": 68,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 74.9,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": 72.9,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 19
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": 75.8,
          "winner": "A",
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": 68.2,
          "winner": "B",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "glm-5-1-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "scoreDiff": 6,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 68,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 19
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 17
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "scoreDiff": 6,
      "winsA": 3,
      "winsB": 1,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 68,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 14
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": 77.4,
          "winner": "A",
          "benchmarkCount": 17
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 47,
      "benchmarkCountB": 40,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 77.2,
          "winner": "B",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": 54.5,
          "winner": "A",
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": 83.8,
          "winner": "B",
          "benchmarkCount": 9
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 74.7,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": 58,
          "winner": "A",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": 76.3,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-deepseek-v4-pro-max",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-deepseek-v4-pro-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-deepseek-v4-pro-max.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 47,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 74,
          "winner": "B",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": 75.9,
          "winner": "B",
          "benchmarkCount": 14
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": 66.1,
          "winner": "A",
          "benchmarkCount": 17
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "scoreDiff": 1,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 47,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": 63.1,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-claude-opus-4-7-adaptive",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-claude-opus-4-7-adaptive",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-claude-opus-4-7-adaptive.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 47,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 74.9,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": 72.9,
          "winner": "B",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": 68.2,
          "winner": "A",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-glm-5-1.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "scoreDiff": 4,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 47,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-claude-sonnet-4-6",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-claude-sonnet-4-6",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-claude-sonnet-4-6.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "scoreDiff": 4,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 47,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": 77.4,
          "winner": "B",
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": 73.7,
          "winner": "A",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 40,
      "benchmarkCountB": 42,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 74,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": 75.9,
          "winner": "B",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": 66.1,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "scoreDiff": 1,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 40,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": 63.1,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 3,
      "comparableCategoryCount": 5,
      "benchmarkCountA": 40,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 74.9,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": 72.9,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": 64.3,
          "winner": "A",
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": 75.8,
          "winner": "B",
          "benchmarkCount": 6
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": 68.2,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-glm-5-1.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "scoreDiff": 4,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 40,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": 60.9,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gemini-3-5-flash",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gemini-3-5-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gemini-3-5-flash.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "scoreDiff": 4,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 40,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 13
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": 77.4,
          "winner": "A",
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "modelB": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "scoreDiff": 1,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 42,
      "benchmarkCountB": 25,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74,
          "avgB": 71.5,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 75.9,
          "avgB": 63.1,
          "winner": "A",
          "benchmarkCount": 11
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-deepseek-v4-pro-max",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-deepseek-v4-pro-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-deepseek-v4-pro-max.md",
      "modelA": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "scoreDiff": 2,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 42,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74,
          "avgB": 74.9,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 75.9,
          "avgB": 72.9,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 64.3,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 6
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 68.2,
          "winner": "B",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-glm-5-1.md",
      "modelA": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "scoreDiff": 4,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 42,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 75.9,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-deepseek-v4-pro-max",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-deepseek-v4-pro-max",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-deepseek-v4-pro-max.md",
      "modelA": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "scoreDiff": 4,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 42,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 75.9,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 13
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "modelB": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "scoreDiff": 1,
      "winsA": 0,
      "winsB": 2,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 25,
      "benchmarkCountB": 36,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.5,
          "avgB": 74.9,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.1,
          "avgB": 72.9,
          "winner": "B",
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 64.3,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": 75.8,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 68.2,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 43.8,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-1-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "scoreDiff": 3,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 25,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.5,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.1,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 52.3,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gpt-5-3-codex",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gpt-5-3-codex",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gpt-5-3-codex.md",
      "modelA": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 25,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.5,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.1,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 73.7,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-glm-5-1.md",
      "modelA": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "modelB": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "scoreDiff": 2,
      "winsA": 3,
      "winsB": 0,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 36,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74.9,
          "avgB": 65.3,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.9,
          "avgB": 60.9,
          "winner": "A",
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 64.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 75.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 68.2,
          "avgB": 52.3,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 43.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-claude-sonnet-4-6",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-claude-sonnet-4-6",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-claude-sonnet-4-6.md",
      "modelA": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "A",
      "winner": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "scoreDiff": 2,
      "winsA": 2,
      "winsB": 2,
      "comparableCategoryCount": 4,
      "benchmarkCountA": 36,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74.9,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.9,
          "avgB": 66.4,
          "winner": "A",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 64.3,
          "avgB": 77.4,
          "winner": "B",
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 75.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 68.2,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 43.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-glm-5-1",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-glm-5-1",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-glm-5-1.md",
      "modelA": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "modelB": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "overallWinner": "tie",
      "winner": null,
      "scoreDiff": 0,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 33,
      "benchmarkCountB": 33,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 65.3,
          "avgB": 65.1,
          "winner": "A",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.9,
          "avgB": 66.4,
          "winner": "B",
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": 77.4,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 52.3,
          "avgB": 73.7,
          "winner": "B",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-mythos-5-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-mythos-5-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-mythos-5-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-mythos-5",
        "canonicalModelKey": "claude-mythos-5",
        "model": "Claude Mythos 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 99,
        "rankingEligible": true,
        "overallRank": 1,
        "url": "https://benchlm.ai/models/claude-mythos-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-mythos-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 1,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 19,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 87,
          "avgB": 82.6,
          "winner": "A",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-fable-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-fable-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-fable-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-fable-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-fable-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-fable",
        "canonicalModelKey": "claude-fable-5",
        "model": "Claude Fable 5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M+",
        "contextWindowTokens": 1000000,
        "displayScore": 97,
        "rankingEligible": true,
        "overallRank": 2,
        "url": "https://benchlm.ai/models/claude-fable",
        "markdownUrl": "https://benchlm.ai/md/models/claude-fable.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 3,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 19,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 85.2,
          "avgB": 82.6,
          "winner": "A",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 85.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 74.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 7,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 41,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-opus-4-8-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-opus-4-8-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-8-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-opus-4-8",
        "canonicalModelKey": "claude-opus-4-8",
        "model": "Claude Opus 4.8",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 93,
        "rankingEligible": true,
        "overallRank": 3,
        "url": "https://benchlm.ai/models/claude-opus-4-8",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-8.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 7,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 41,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 80.1,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 9,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 38,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-1-pro-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-3-1-pro-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-pro-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-3-1-pro",
        "canonicalModelKey": "gemini-3-1-pro",
        "model": "Gemini 3.1 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 4,
        "url": "https://benchlm.ai/models/gemini-3-1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 9,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 38,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 82.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 77.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 9,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 51,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-7-max",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-7-max",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-7-max.md",
      "modelA": {
        "slug": "qwen3-7-max",
        "canonicalModelKey": "qwen3-7-max",
        "model": "Qwen3.7 Max",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 91,
        "rankingEligible": true,
        "overallRank": 5,
        "url": "https://benchlm.ai/models/qwen3-7-max",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-max.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 9,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 51,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 69.7,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 90.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 71.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "gpt-5-4-pro-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-4-pro-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-pro-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 10,
      "winsA": 0,
      "winsB": 3,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 10,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": 52.4,
          "winner": "B",
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gpt-5-4-pro-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-4-pro-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-pro-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-4-pro",
        "canonicalModelKey": "gpt-5-4-pro",
        "model": "GPT-5.4 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 90,
        "rankingEligible": true,
        "overallRank": 6,
        "url": "https://benchlm.ai/models/gpt-5-4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 10,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 10,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 89.3,
          "avgB": 82.6,
          "winner": "A",
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 94,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 83.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 50,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "gpt-5-5-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-5-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 11,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 42,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": 52.4,
          "winner": "B",
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-5-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-5-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-5",
        "canonicalModelKey": "gpt-5-5",
        "model": "GPT-5.5",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 7,
        "url": "https://benchlm.ai/models/gpt-5-5",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 11,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 42,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 81.5,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 51.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 11,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 3
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-pro-deep-think-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-3-pro-deep-think-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-deep-think-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-3-pro-deep-think",
        "canonicalModelKey": "gemini-3-pro-deep-think",
        "model": "Gemini 3 Pro Deep Think",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 8,
        "url": "https://benchlm.ai/models/gemini-3-pro-deep-think",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro-deep-think.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 11,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 3
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 45.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-grok-4-1",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-grok-4-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-grok-4-1.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 11,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "grok-4-1-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/grok-4-1-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-4-1-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "grok-4-1",
        "canonicalModelKey": "grok-4-1",
        "model": "Grok 4.1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 89,
        "rankingEligible": true,
        "overallRank": 9,
        "url": "https://benchlm.ai/models/grok-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 11,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-4-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-4-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 12,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 48,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-4-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-4-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-4-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-4",
        "canonicalModelKey": "gpt-5-4",
        "model": "GPT-5.4",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1.05M",
        "contextWindowTokens": 1050000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 10,
        "url": "https://benchlm.ai/models/gpt-5-4",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-4.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 12,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 48,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 12,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 68,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 14
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-7-plus",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-7-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-7-plus.md",
      "modelA": {
        "slug": "qwen3-7-plus",
        "canonicalModelKey": "qwen3-7-plus",
        "model": "Qwen3.7 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 88,
        "rankingEligible": true,
        "overallRank": 11,
        "url": "https://benchlm.ai/models/qwen3-7-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-7-plus.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 12,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 68,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.7,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 15
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 91.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 67.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 89.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 14,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 47,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-opus-4-6-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-opus-4-6-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-6-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-opus-4-6",
        "canonicalModelKey": "claude-opus-4-6",
        "model": "Claude Opus 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 12,
        "url": "https://benchlm.ai/models/claude-opus-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-6.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 14,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 47,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 72.6,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 15
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 14,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 40,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-5-flash-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-3-5-flash-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-5-flash-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-3-5-flash",
        "canonicalModelKey": "gemini-3-5-flash",
        "model": "Gemini 3.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 13,
        "url": "https://benchlm.ai/models/gemini-3-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-5-flash.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 14,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 40,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 77.2,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 83.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 74.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 58,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 76.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 14,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 42,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 75.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-max-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-max-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-max-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v4-pro-max",
        "canonicalModelKey": "deepseek-v4-pro-max",
        "model": "DeepSeek V4 Pro (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 86,
        "rankingEligible": true,
        "overallRank": 14,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-max.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 14,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 42,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 75.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 15,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 25,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.5,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-3-codex-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-3-codex-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-3-codex-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-3-codex",
        "canonicalModelKey": "gpt-5-3-codex",
        "model": "GPT-5.3 Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 85,
        "rankingEligible": true,
        "overallRank": 15,
        "url": "https://benchlm.ai/models/gpt-5-3-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-3-codex.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 15,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 25,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.5,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 16,
      "winsA": 1,
      "winsB": 2,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 36,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74.9,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 64.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 75.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 68.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 43.8,
          "avgB": 52.4,
          "winner": "B",
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-opus-4-7-adaptive-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-opus-4-7-adaptive-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-7-adaptive-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-opus-4-7-adaptive",
        "canonicalModelKey": "claude-opus-4-7-max",
        "model": "Claude Opus 4.7 (Adaptive)",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 84,
        "rankingEligible": true,
        "overallRank": 16,
        "url": "https://benchlm.ai/models/claude-opus-4-7-adaptive",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-7-adaptive.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 16,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 36,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 74.9,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 64.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 75.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 68.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 43.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-1-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 18,
      "winsA": 0,
      "winsB": 2,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 33,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 65.3,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 52.3,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "glm-5-1-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/glm-5-1-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-1-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "glm-5-1",
        "canonicalModelKey": "glm-5-1",
        "model": "GLM-5.1",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "203K",
        "contextWindowTokens": 203000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 17,
        "url": "https://benchlm.ai/models/glm-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 18,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 33,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 65.3,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 52.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 18,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 33,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 65.1,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 73.7,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-sonnet-4-6-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-6-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-6-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-sonnet-4-6",
        "canonicalModelKey": "claude-sonnet-4-6",
        "model": "Claude Sonnet 4.6",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 18,
        "url": "https://benchlm.ai/models/claude-sonnet-4-6",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-6.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 18,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 33,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 65.1,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 66.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 73.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-high-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-high-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-high-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v4-pro-high",
        "canonicalModelKey": "deepseek-v4-pro-high",
        "model": "DeepSeek V4 Pro (High)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 19,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-high",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-high.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 18,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 40,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 70,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.6,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-high-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-high-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-high-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v4-pro-high",
        "canonicalModelKey": "deepseek-v4-pro-high",
        "model": "DeepSeek V4 Pro (High)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 19,
        "url": "https://benchlm.ai/models/deepseek-v4-pro-high",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro-high.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 18,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 40,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 70,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-o1-preview",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-o1-preview",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-o1-preview.md",
      "modelA": {
        "slug": "o1-preview",
        "canonicalModelKey": "o1-preview",
        "model": "o1-preview",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 20,
        "url": "https://benchlm.ai/models/o1-preview",
        "markdownUrl": "https://benchlm.ai/md/models/o1-preview.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 18,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-o1-preview",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-o1-preview",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-o1-preview.md",
      "modelA": {
        "slug": "o1-preview",
        "canonicalModelKey": "o1-preview",
        "model": "o1-preview",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 82,
        "rankingEligible": true,
        "overallRank": 20,
        "url": "https://benchlm.ai/models/o1-preview",
        "markdownUrl": "https://benchlm.ai/md/models/o1-preview.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 18,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-kimi-2-6",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-kimi-2-6",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-kimi-2-6.md",
      "modelA": {
        "slug": "kimi-2-6",
        "canonicalModelKey": "kimi-2-6",
        "model": "Kimi K2.6",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 81,
        "rankingEligible": true,
        "overallRank": 21,
        "url": "https://benchlm.ai/models/kimi-2-6",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-2-6.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 19,
      "winsA": 0,
      "winsB": 2,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 48,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 73.1,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 79.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 53.8,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-kimi-2-6",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-kimi-2-6",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-kimi-2-6.md",
      "modelA": {
        "slug": "kimi-2-6",
        "canonicalModelKey": "kimi-2-6",
        "model": "Kimi K2.6",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 81,
        "rankingEligible": true,
        "overallRank": 21,
        "url": "https://benchlm.ai/models/kimi-2-6",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-2-6.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 19,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 48,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 73.1,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 14
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 79.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 53.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "gemini-3-pro-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-3-pro-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-3-pro",
        "canonicalModelKey": "gemini-3-pro",
        "model": "Gemini 3 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 80,
        "rankingEligible": true,
        "overallRank": 22,
        "url": "https://benchlm.ai/models/gemini-3-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 20,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 26,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 31.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-pro-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-3-pro-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-pro-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-3-pro",
        "canonicalModelKey": "gemini-3-pro",
        "model": "Gemini 3 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 80,
        "rankingEligible": true,
        "overallRank": 22,
        "url": "https://benchlm.ai/models/gemini-3-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 20,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 26,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 81.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 31.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-minimax-m3",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-minimax-m3",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-minimax-m3.md",
      "modelA": {
        "slug": "minimax-m3",
        "canonicalModelKey": "minimax-m3",
        "model": "MiniMax M3",
        "creator": "MiniMax",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 79,
        "rankingEligible": true,
        "overallRank": 23,
        "url": "https://benchlm.ai/models/minimax-m3",
        "markdownUrl": "https://benchlm.ai/md/models/minimax-m3.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 21,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 38,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.9,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 67,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 64.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-minimax-m3",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-minimax-m3",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-minimax-m3.md",
      "modelA": {
        "slug": "minimax-m3",
        "canonicalModelKey": "minimax-m3",
        "model": "MiniMax M3",
        "creator": "MiniMax",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 79,
        "rankingEligible": true,
        "overallRank": 23,
        "url": "https://benchlm.ai/models/minimax-m3",
        "markdownUrl": "https://benchlm.ai/md/models/minimax-m3.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 21,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 38,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 71.9,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 67,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 10
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 64.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-reasoning-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/glm-5-reasoning-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-reasoning-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "glm-5-reasoning",
        "canonicalModelKey": "glm-5-reasoning",
        "model": "GLM-5 (Reasoning)",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 79,
        "rankingEligible": true,
        "overallRank": 24,
        "url": "https://benchlm.ai/models/glm-5-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-reasoning.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 21,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-5-reasoning-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/glm-5-reasoning-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-reasoning-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "glm-5-reasoning",
        "canonicalModelKey": "glm-5-reasoning",
        "model": "GLM-5 (Reasoning)",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 79,
        "rankingEligible": true,
        "overallRank": 24,
        "url": "https://benchlm.ai/models/glm-5-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5-reasoning.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 21,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-2-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-2-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-2-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-2",
        "canonicalModelKey": "gpt-5-2",
        "model": "GPT-5.2",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 78,
        "rankingEligible": true,
        "overallRank": 25,
        "url": "https://benchlm.ai/models/gpt-5-2",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-2.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 22,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 29,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 55.2,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 80.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 52.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 92.4,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-2-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-2-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-2-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-2",
        "canonicalModelKey": "gpt-5-2",
        "model": "GPT-5.2",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 78,
        "rankingEligible": true,
        "overallRank": 25,
        "url": "https://benchlm.ai/models/gpt-5-2",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-2.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 22,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 29,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 55.2,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 80.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 52.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 92.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-5-397b-reasoning",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-5-397b-reasoning",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-5-397b-reasoning.md",
      "modelA": {
        "slug": "qwen3-5-397b-reasoning",
        "canonicalModelKey": "qwen3-5-397b-reasoning",
        "model": "Qwen3.5 397B (Reasoning)",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 77,
        "rankingEligible": true,
        "overallRank": 26,
        "url": "https://benchlm.ai/models/qwen3-5-397b-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-397b-reasoning.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 23,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-5-397b-reasoning",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-5-397b-reasoning",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-5-397b-reasoning.md",
      "modelA": {
        "slug": "qwen3-5-397b-reasoning",
        "canonicalModelKey": "qwen3-5-397b-reasoning",
        "model": "Qwen3.5 397B (Reasoning)",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 77,
        "rankingEligible": true,
        "overallRank": 26,
        "url": "https://benchlm.ai/models/qwen3-5-397b-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-397b-reasoning.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 23,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-1-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-1-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-1-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-1",
        "canonicalModelKey": "gpt-5-1",
        "model": "GPT-5.1",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 77,
        "rankingEligible": true,
        "overallRank": 27,
        "url": "https://benchlm.ai/models/gpt-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 23,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 20,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-1-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-1-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-1-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-1",
        "canonicalModelKey": "gpt-5-1",
        "model": "GPT-5.1",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 77,
        "rankingEligible": true,
        "overallRank": 27,
        "url": "https://benchlm.ai/models/gpt-5-1",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 23,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 20,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-opus-4-5-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-opus-4-5-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-5-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-opus-4-5",
        "canonicalModelKey": "claude-opus-4-5",
        "model": "Claude Opus 4.5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 76,
        "rankingEligible": true,
        "overallRank": 28,
        "url": "https://benchlm.ai/models/claude-opus-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 24,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 60,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 62.5,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 19
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 65.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 64.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 79.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "claude-opus-4-5-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-opus-4-5-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-opus-4-5-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-opus-4-5",
        "canonicalModelKey": "claude-opus-4-5",
        "model": "Claude Opus 4.5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 76,
        "rankingEligible": true,
        "overallRank": 28,
        "url": "https://benchlm.ai/models/claude-opus-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-opus-4-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 24,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 60,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 62.5,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 18
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 65.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 64.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 79.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 85.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-gpt-5-high",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-gpt-5-high",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-gpt-5-high.md",
      "modelA": {
        "slug": "gpt-5-high",
        "canonicalModelKey": "gpt-5-high",
        "model": "GPT-5 (high)",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 76,
        "rankingEligible": true,
        "overallRank": 29,
        "url": "https://benchlm.ai/models/gpt-5-high",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-high.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 24,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-high-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-high-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-high-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-high",
        "canonicalModelKey": "gpt-5-high",
        "model": "GPT-5 (high)",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 76,
        "rankingEligible": true,
        "overallRank": 29,
        "url": "https://benchlm.ai/models/gpt-5-high",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-high.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 24,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-2-codex-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-2-codex-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-2-codex-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-2-codex",
        "canonicalModelKey": "gpt-5-2-codex",
        "model": "GPT-5.2-Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 76,
        "rankingEligible": true,
        "overallRank": 30,
        "url": "https://benchlm.ai/models/gpt-5-2-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-2-codex.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 24,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-2-codex-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-2-codex-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-2-codex-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-2-codex",
        "canonicalModelKey": "gpt-5-2-codex",
        "model": "GPT-5.2-Codex",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 76,
        "rankingEligible": true,
        "overallRank": 30,
        "url": "https://benchlm.ai/models/gpt-5-2-codex",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-2-codex.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 24,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-kimi-k2-5-reasoning",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-kimi-k2-5-reasoning",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-kimi-k2-5-reasoning.md",
      "modelA": {
        "slug": "kimi-k2-5-reasoning",
        "canonicalModelKey": "kimi-k2-5-reasoning",
        "model": "Kimi K2.5 (Reasoning)",
        "creator": "Moonshot AI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 75,
        "rankingEligible": true,
        "overallRank": 31,
        "url": "https://benchlm.ai/models/kimi-k2-5-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-5-reasoning.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 25,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 28,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 54.6,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 78.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 87.3,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 96.1,
          "avgB": 52.4,
          "winner": "A",
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-kimi-k2-5-reasoning",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-kimi-k2-5-reasoning",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-kimi-k2-5-reasoning.md",
      "modelA": {
        "slug": "kimi-k2-5-reasoning",
        "canonicalModelKey": "kimi-k2-5-reasoning",
        "model": "Kimi K2.5 (Reasoning)",
        "creator": "Moonshot AI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 75,
        "rankingEligible": true,
        "overallRank": 31,
        "url": "https://benchlm.ai/models/kimi-k2-5-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-5-reasoning.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 25,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 28,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 54.6,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 76.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 78.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 87.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 96.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-1-codex-max-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-5-1-codex-max-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-1-codex-max-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-5-1-codex-max",
        "canonicalModelKey": "gpt-5-1-codex-max",
        "model": "GPT-5.1-Codex-Max",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 75,
        "rankingEligible": true,
        "overallRank": 32,
        "url": "https://benchlm.ai/models/gpt-5-1-codex-max",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-1-codex-max.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 25,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-1-codex-max-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-1-codex-max-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-1-codex-max-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-1-codex-max",
        "canonicalModelKey": "gpt-5-1-codex-max",
        "model": "GPT-5.1-Codex-Max",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "400K",
        "contextWindowTokens": 400000,
        "displayScore": 75,
        "rankingEligible": true,
        "overallRank": 32,
        "url": "https://benchlm.ai/models/gpt-5-1-codex-max",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-1-codex-max.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 25,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-flash-max-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-flash-max-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-flash-max-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v4-flash-max",
        "canonicalModelKey": "deepseek-v4-flash-max",
        "model": "DeepSeek V4 Flash (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 74,
        "rankingEligible": true,
        "overallRank": 33,
        "url": "https://benchlm.ai/models/deepseek-v4-flash-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-flash-max.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 26,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 40,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 63.3,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 60,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "deepseek-v4-flash-max-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v4-flash-max-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-flash-max-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v4-flash-max",
        "canonicalModelKey": "deepseek-v4-flash-max",
        "model": "DeepSeek V4 Flash (Max)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 74,
        "rankingEligible": true,
        "overallRank": 33,
        "url": "https://benchlm.ai/models/deepseek-v4-flash-max",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-flash-max.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 26,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 40,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 63.3,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 60,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-6-27b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-6-27b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-6-27b.md",
      "modelA": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 28,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 55,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 59.3,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-6-27b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-6-27b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-6-27b.md",
      "modelA": {
        "slug": "qwen3-6-27b",
        "canonicalModelKey": "qwen3-6-27b",
        "model": "Qwen3.6-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 72,
        "rankingEligible": true,
        "overallRank": 34,
        "url": "https://benchlm.ai/models/qwen3-6-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-27b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 28,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 55,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 59.3,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 11
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 16
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-grok-4-20-beta",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-grok-4-20-beta",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-grok-4-20-beta.md",
      "modelA": {
        "slug": "grok-4-20-beta",
        "canonicalModelKey": "grok-4-20-beta",
        "model": "Grok 4.20",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 71,
        "rankingEligible": true,
        "overallRank": 35,
        "url": "https://benchlm.ai/models/grok-4-20-beta",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-20-beta.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 29,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 47.1,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 61,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 53.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "grok-4-20-beta-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/grok-4-20-beta-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-4-20-beta-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "grok-4-20-beta",
        "canonicalModelKey": "grok-4-20-beta",
        "model": "Grok 4.20",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 71,
        "rankingEligible": true,
        "overallRank": 35,
        "url": "https://benchlm.ai/models/grok-4-20-beta",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-20-beta.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 29,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 47.1,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 61,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 70.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 53.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-flash-high-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-flash-high-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-flash-high-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v4-flash-high",
        "canonicalModelKey": "deepseek-v4-flash-high",
        "model": "DeepSeek V4 Flash (High)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 71,
        "rankingEligible": true,
        "overallRank": 36,
        "url": "https://benchlm.ai/models/deepseek-v4-flash-high",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-flash-high.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 29,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 40,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 55.4,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 57.2,
          "avgB": 57.2,
          "winner": "tie",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "deepseek-v4-flash-high-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v4-flash-high-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-flash-high-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v4-flash-high",
        "canonicalModelKey": "deepseek-v4-flash-high",
        "model": "DeepSeek V4 Flash (High)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 71,
        "rankingEligible": true,
        "overallRank": 36,
        "url": "https://benchlm.ai/models/deepseek-v4-flash-high",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-flash-high.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 29,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 40,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 55.4,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 57.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-gpt-5-medium",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-gpt-5-medium",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-gpt-5-medium.md",
      "modelA": {
        "slug": "gpt-5-medium",
        "canonicalModelKey": "gpt-5-medium",
        "model": "GPT-5 (medium)",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 70,
        "rankingEligible": true,
        "overallRank": 37,
        "url": "https://benchlm.ai/models/gpt-5-medium",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-medium.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 30,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-medium-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-medium-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-medium-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-5-medium",
        "canonicalModelKey": "gpt-5-medium",
        "model": "GPT-5 (medium)",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 70,
        "rankingEligible": true,
        "overallRank": 37,
        "url": "https://benchlm.ai/models/gpt-5-medium",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-medium.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 30,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-nemotron-3-ultra",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-nemotron-3-ultra",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-nemotron-3-ultra.md",
      "modelA": {
        "slug": "nemotron-3-ultra",
        "canonicalModelKey": "nemotron-3-ultra-500b",
        "model": "Nemotron 3 Ultra",
        "creator": "NVIDIA",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 38,
        "url": "https://benchlm.ai/models/nemotron-3-ultra",
        "markdownUrl": "https://benchlm.ai/md/models/nemotron-3-ultra.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 32,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 34,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 51.7,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 74.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 61.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.6,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 81.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 83,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-nemotron-3-ultra",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-nemotron-3-ultra",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-nemotron-3-ultra.md",
      "modelA": {
        "slug": "nemotron-3-ultra",
        "canonicalModelKey": "nemotron-3-ultra-500b",
        "model": "Nemotron 3 Ultra",
        "creator": "NVIDIA",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 38,
        "url": "https://benchlm.ai/models/nemotron-3-ultra",
        "markdownUrl": "https://benchlm.ai/md/models/nemotron-3-ultra.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 32,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 34,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 51.7,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 10
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 74.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 61.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 62.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 81.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 83,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v4-pro",
        "canonicalModelKey": "deepseek-v4-pro",
        "model": "DeepSeek V4 Pro",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 39,
        "url": "https://benchlm.ai/models/deepseek-v4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 32,
      "winsA": 0,
      "winsB": 2,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 23,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 59.1,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49.4,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 7
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "deepseek-v4-pro-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v4-pro-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-pro-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v4-pro",
        "canonicalModelKey": "deepseek-v4-pro",
        "model": "DeepSeek V4 Pro",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 39,
        "url": "https://benchlm.ai/models/deepseek-v4-pro",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 32,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 23,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 59.1,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 49.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "glm-4-7-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/glm-4-7-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-4-7-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "glm-4-7",
        "canonicalModelKey": "glm-4-7",
        "model": "GLM-4.7",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 40,
        "url": "https://benchlm.ai/models/glm-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/glm-4-7.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 32,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 28,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 45.3,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 60.6,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 95.7,
          "avgB": 52.4,
          "winner": "A",
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "glm-4-7-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/glm-4-7-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-4-7-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "glm-4-7",
        "canonicalModelKey": "glm-4-7",
        "model": "GLM-4.7",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 40,
        "url": "https://benchlm.ai/models/glm-4-7",
        "markdownUrl": "https://benchlm.ai/md/models/glm-4-7.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 32,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 28,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 45.3,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 9
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 60.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 95.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-grok-4-1-fast",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-grok-4-1-fast",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-grok-4-1-fast.md",
      "modelA": {
        "slug": "grok-4-1-fast",
        "canonicalModelKey": "grok-4-1-fast",
        "model": "Grok 4.1 Fast",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 41,
        "url": "https://benchlm.ai/models/grok-4-1-fast",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1-fast.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 32,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "grok-4-1-fast-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/grok-4-1-fast-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-4-1-fast-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "grok-4-1-fast",
        "canonicalModelKey": "grok-4-1-fast",
        "model": "Grok 4.1 Fast",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 68,
        "rankingEligible": true,
        "overallRank": 41,
        "url": "https://benchlm.ai/models/grok-4-1-fast",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4-1-fast.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 32,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "glm-5-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/glm-5-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "glm-5",
        "canonicalModelKey": "glm-5",
        "model": "GLM-5",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 67,
        "rankingEligible": true,
        "overallRank": 42,
        "url": "https://benchlm.ai/models/glm-5",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 33,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 52,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 56.2,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 60.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.7,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 92.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 83.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 7
        }
      }
    },
    {
      "slug": "glm-5-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/glm-5-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-5-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "glm-5",
        "canonicalModelKey": "glm-5",
        "model": "GLM-5",
        "creator": "Z.AI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 67,
        "rankingEligible": true,
        "overallRank": 42,
        "url": "https://benchlm.ai/models/glm-5",
        "markdownUrl": "https://benchlm.ai/md/models/glm-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 33,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 52,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 56.2,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 60.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 92.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 83.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-6-plus",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-6-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-6-plus.md",
      "modelA": {
        "slug": "qwen3-6-plus",
        "canonicalModelKey": "qwen3-6-plus",
        "model": "Qwen3.6 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 66,
        "rankingEligible": true,
        "overallRank": 43,
        "url": "https://benchlm.ai/models/qwen3-6-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-plus.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 34,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 58,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 61.6,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 79.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 62,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 87.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 84.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-6-plus",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-6-plus",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-6-plus.md",
      "modelA": {
        "slug": "qwen3-6-plus",
        "canonicalModelKey": "qwen3-6-plus",
        "model": "Qwen3.6 Plus",
        "creator": "Alibaba",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 66,
        "rankingEligible": true,
        "overallRank": 43,
        "url": "https://benchlm.ai/models/qwen3-6-plus",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-plus.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 34,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 58,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 61.6,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 79.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 62,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 87.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 84.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-mai-thinking-1",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-mai-thinking-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-mai-thinking-1.md",
      "modelA": {
        "slug": "mai-thinking-1",
        "canonicalModelKey": "mai-thinking-1",
        "model": "MAI-Thinking-1",
        "creator": "Microsoft",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 65,
        "rankingEligible": true,
        "overallRank": 44,
        "url": "https://benchlm.ai/models/mai-thinking-1",
        "markdownUrl": "https://benchlm.ai/md/models/mai-thinking-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 35,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 14,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 46,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 69.9,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 97,
          "avgB": 52.4,
          "winner": "A",
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-mai-thinking-1",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-mai-thinking-1",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-mai-thinking-1.md",
      "modelA": {
        "slug": "mai-thinking-1",
        "canonicalModelKey": "mai-thinking-1",
        "model": "MAI-Thinking-1",
        "creator": "Microsoft",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 65,
        "rankingEligible": true,
        "overallRank": 44,
        "url": "https://benchlm.ai/models/mai-thinking-1",
        "markdownUrl": "https://benchlm.ai/md/models/mai-thinking-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 35,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 14,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 46,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 71,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 69.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 85,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 97,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-6-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-6-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-6-35b-a3b.md",
      "modelA": {
        "slug": "qwen3-6-35b-a3b",
        "canonicalModelKey": "qwen3-6-35b-a3b",
        "model": "Qwen3.6-35B-A3B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 65,
        "rankingEligible": true,
        "overallRank": 45,
        "url": "https://benchlm.ai/models/qwen3-6-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-35b-a3b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 35,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 58,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 51.5,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 66.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 15
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 60.5,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-6-35b-a3b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-6-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-6-35b-a3b.md",
      "modelA": {
        "slug": "qwen3-6-35b-a3b",
        "canonicalModelKey": "qwen3-6-35b-a3b",
        "model": "Qwen3.6-35B-A3B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 65,
        "rankingEligible": true,
        "overallRank": 45,
        "url": "https://benchlm.ai/models/qwen3-6-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-6-35b-a3b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 35,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 58,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 51.5,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 66.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 76.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 15
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 60.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "claude-sonnet-4-5-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-5-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-5-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-sonnet-4-5",
        "canonicalModelKey": "claude-sonnet-4-5",
        "model": "Claude Sonnet 4.5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 64,
        "rankingEligible": true,
        "overallRank": 46,
        "url": "https://benchlm.ai/models/claude-sonnet-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 36,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 9,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 55.3,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 77.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 13.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 83.4,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 87,
          "avgB": 52.4,
          "winner": "A",
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "claude-sonnet-4-5-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-sonnet-4-5-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-sonnet-4-5-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-sonnet-4-5",
        "canonicalModelKey": "claude-sonnet-4-5",
        "model": "Claude Sonnet 4.5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 64,
        "rankingEligible": true,
        "overallRank": 46,
        "url": "https://benchlm.ai/models/claude-sonnet-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-sonnet-4-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 36,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 9,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 55.3,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 4
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 77.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 13.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 83.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 87,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-kimi-k2-5",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-kimi-k2-5",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-kimi-k2-5.md",
      "modelA": {
        "slug": "kimi-k2-5",
        "canonicalModelKey": "kimi-k2-5",
        "model": "Kimi K2.5",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 47,
        "url": "https://benchlm.ai/models/kimi-k2-5",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 37,
      "winsA": 2,
      "winsB": 1,
      "comparableCategoryCount": 3,
      "benchmarkCountA": 61,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 54.6,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 78.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 61,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 65.1,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 93.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 82.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 96.1,
          "avgB": 52.4,
          "winner": "A",
          "benchmarkCount": 8
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-kimi-k2-5",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-kimi-k2-5",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-kimi-k2-5.md",
      "modelA": {
        "slug": "kimi-k2-5",
        "canonicalModelKey": "kimi-k2-5",
        "model": "Kimi K2.5",
        "creator": "Moonshot AI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 47,
        "url": "https://benchlm.ai/models/kimi-k2-5",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 37,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 61,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 54.6,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 18
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 64.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 78.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 61,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 65.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 93.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 82.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 96.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-5-122b-a10b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-5-122b-a10b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-5-122b-a10b.md",
      "modelA": {
        "slug": "qwen3-5-122b-a10b",
        "canonicalModelKey": "qwen3-5-122b-a10b",
        "model": "Qwen3.5-122B-A10B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 48,
        "url": "https://benchlm.ai/models/qwen3-5-122b-a10b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-122b-a10b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 37,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 32,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 56.1,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 60.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 81.6,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 93.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 82.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-5-122b-a10b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-5-122b-a10b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-5-122b-a10b.md",
      "modelA": {
        "slug": "qwen3-5-122b-a10b",
        "canonicalModelKey": "qwen3-5-122b-a10b",
        "model": "Qwen3.5-122B-A10B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 48,
        "url": "https://benchlm.ai/models/qwen3-5-122b-a10b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-122b-a10b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 37,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 32,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 56.1,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 77.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 60.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 81.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 93.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 82.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-2-5-pro-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-2-5-pro-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-2-5-pro-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-2-5-pro",
        "canonicalModelKey": "gemini-2-5-pro",
        "model": "Gemini 2.5 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 49,
        "url": "https://benchlm.ai/models/gemini-2-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-2-5-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 37,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 23,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 40.8,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-2-5-pro-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-2-5-pro-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-2-5-pro-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-2-5-pro",
        "canonicalModelKey": "gemini-2-5-pro",
        "model": "Gemini 2.5 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 49,
        "url": "https://benchlm.ai/models/gemini-2-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-2-5-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 37,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 23,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 40.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-grok-4",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-grok-4",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-grok-4.md",
      "modelA": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 37,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "grok-4-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/grok-4-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-4-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "grok-4",
        "canonicalModelKey": "grok-4",
        "model": "Grok 4",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 63,
        "rankingEligible": true,
        "overallRank": 50,
        "url": "https://benchlm.ai/models/grok-4",
        "markdownUrl": "https://benchlm.ai/md/models/grok-4.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 37,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-5-397b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-5-397b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-5-397b.md",
      "modelA": {
        "slug": "qwen3-5-397b",
        "canonicalModelKey": "qwen3-5-397b",
        "model": "Qwen3.5 397B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 62,
        "rankingEligible": true,
        "overallRank": 51,
        "url": "https://benchlm.ai/models/qwen3-5-397b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-397b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 38,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 54,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 56.2,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 16
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 79.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 63.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 65.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 13
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 92.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 84.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 6
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-5-397b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-5-397b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-5-397b.md",
      "modelA": {
        "slug": "qwen3-5-397b",
        "canonicalModelKey": "qwen3-5-397b",
        "model": "Qwen3.5 397B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 62,
        "rankingEligible": true,
        "overallRank": 51,
        "url": "https://benchlm.ai/models/qwen3-5-397b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-397b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 38,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 54,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 56.2,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 17
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 79.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 7
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 63.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 65.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 92.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 84.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-5-27b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-5-27b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-5-27b.md",
      "modelA": {
        "slug": "qwen3-5-27b",
        "canonicalModelKey": "qwen3-5-27b",
        "model": "Qwen3.5-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 61,
        "rankingEligible": true,
        "overallRank": 52,
        "url": "https://benchlm.ai/models/qwen3-5-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-27b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 39,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 33,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 51.6,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 60.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 80.6,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 95,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 82.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-5-27b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-5-27b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-5-27b.md",
      "modelA": {
        "slug": "qwen3-5-27b",
        "canonicalModelKey": "qwen3-5-27b",
        "model": "Qwen3.5-27B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 61,
        "rankingEligible": true,
        "overallRank": 52,
        "url": "https://benchlm.ai/models/qwen3-5-27b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-27b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 39,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 33,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 51.6,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 63,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 60.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 80.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 95,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 82.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v3-2-thinking-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v3-2-thinking-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-2-thinking-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v3-2-thinking",
        "canonicalModelKey": "deepseek-v3-2-thinking",
        "model": "DeepSeek V3.2 (Thinking)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 60,
        "rankingEligible": true,
        "overallRank": 53,
        "url": "https://benchlm.ai/models/deepseek-v3-2-thinking",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-2-thinking.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 40,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v3-2-thinking-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v3-2-thinking-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-2-thinking-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v3-2-thinking",
        "canonicalModelKey": "deepseek-v3-2-thinking",
        "model": "DeepSeek V3.2 (Thinking)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 60,
        "rankingEligible": true,
        "overallRank": 53,
        "url": "https://benchlm.ai/models/deepseek-v3-2-thinking",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-2-thinking.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 40,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-mimo-v2-flash",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-mimo-v2-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-mimo-v2-flash.md",
      "modelA": {
        "slug": "mimo-v2-flash",
        "canonicalModelKey": "mimo-v2-flash",
        "model": "MiMo-V2-Flash",
        "creator": "Xiaomi",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 59,
        "rankingEligible": true,
        "overallRank": 54,
        "url": "https://benchlm.ai/models/mimo-v2-flash",
        "markdownUrl": "https://benchlm.ai/md/models/mimo-v2-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 41,
      "winsA": 2,
      "winsB": 0,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 21,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 84.5,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 94.1,
          "avgB": 52.4,
          "winner": "A",
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-mimo-v2-flash",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-mimo-v2-flash",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-mimo-v2-flash.md",
      "modelA": {
        "slug": "mimo-v2-flash",
        "canonicalModelKey": "mimo-v2-flash",
        "model": "MiMo-V2-Flash",
        "creator": "Xiaomi",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 59,
        "rankingEligible": true,
        "overallRank": 54,
        "url": "https://benchlm.ai/models/mimo-v2-flash",
        "markdownUrl": "https://benchlm.ai/md/models/mimo-v2-flash.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 41,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 84.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 94.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v4-flash-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v4-flash-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-flash-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v4-flash",
        "canonicalModelKey": "deepseek-v4-flash",
        "model": "DeepSeek V4 Flash",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 55,
        "url": "https://benchlm.ai/models/deepseek-v4-flash",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 43,
      "winsA": 0,
      "winsB": 2,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 23,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 49.1,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 45.2,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 7
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "deepseek-v4-flash-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v4-flash-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v4-flash-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v4-flash",
        "canonicalModelKey": "deepseek-v4-flash",
        "model": "DeepSeek V4 Flash",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 55,
        "url": "https://benchlm.ai/models/deepseek-v4-flash",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v4-flash.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 43,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 23,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 49.1,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 57.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 45.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "gpt-4-1-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-4-1-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-1-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-4-1",
        "canonicalModelKey": "gpt-4-1",
        "model": "GPT-4.1",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 56,
        "url": "https://benchlm.ai/models/gpt-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 43,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 23,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.3,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 87.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-4-1-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-4-1-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-1-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-4-1",
        "canonicalModelKey": "gpt-4-1",
        "model": "GPT-4.1",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 56,
        "url": "https://benchlm.ai/models/gpt-4-1",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 43,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 23,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 54.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 66.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 87.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-o3-pro",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-o3-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-o3-pro.md",
      "modelA": {
        "slug": "o3-pro",
        "canonicalModelKey": "o3-pro",
        "model": "o3-pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 57,
        "url": "https://benchlm.ai/models/o3-pro",
        "markdownUrl": "https://benchlm.ai/md/models/o3-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 43,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-o3-pro",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-o3-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-o3-pro.md",
      "modelA": {
        "slug": "o3-pro",
        "canonicalModelKey": "o3-pro",
        "model": "o3-pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 57,
        "url": "https://benchlm.ai/models/o3-pro",
        "markdownUrl": "https://benchlm.ai/md/models/o3-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 43,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-o1",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-o1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-o1.md",
      "modelA": {
        "slug": "o1",
        "canonicalModelKey": "o1",
        "model": "o1",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 58,
        "url": "https://benchlm.ai/models/o1",
        "markdownUrl": "https://benchlm.ai/md/models/o1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 43,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 19,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 75.7,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 92.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-o1",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-o1",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-o1.md",
      "modelA": {
        "slug": "o1",
        "canonicalModelKey": "o1",
        "model": "o1",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 57,
        "rankingEligible": true,
        "overallRank": 58,
        "url": "https://benchlm.ai/models/o1",
        "markdownUrl": "https://benchlm.ai/md/models/o1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 43,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 19,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 75.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 92.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v3-2-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v3-2-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-2-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v3-2",
        "canonicalModelKey": "deepseek-v3-2",
        "model": "DeepSeek V3.2",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 56,
        "rankingEligible": true,
        "overallRank": 59,
        "url": "https://benchlm.ai/models/deepseek-v3-2",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-2.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 44,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 22,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v3-2-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v3-2-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-2-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v3-2",
        "canonicalModelKey": "deepseek-v3-2",
        "model": "DeepSeek V3.2",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 56,
        "rankingEligible": true,
        "overallRank": 59,
        "url": "https://benchlm.ai/models/deepseek-v3-2",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-2.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 44,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 22,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 60.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-haiku-4-5-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-haiku-4-5-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-haiku-4-5-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-haiku-4-5",
        "canonicalModelKey": "claude-haiku-4-5",
        "model": "Claude Haiku 4.5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 56,
        "rankingEligible": true,
        "overallRank": 60,
        "url": "https://benchlm.ai/models/claude-haiku-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-haiku-4-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 44,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-haiku-4-5-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-haiku-4-5-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-haiku-4-5-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-haiku-4-5",
        "canonicalModelKey": "claude-haiku-4-5",
        "model": "Claude Haiku 4.5",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 56,
        "rankingEligible": true,
        "overallRank": 60,
        "url": "https://benchlm.ai/models/claude-haiku-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/claude-haiku-4-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 44,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 73.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-o3",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-o3",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-o3.md",
      "modelA": {
        "slug": "o3",
        "canonicalModelKey": "o3",
        "model": "o3",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 56,
        "rankingEligible": true,
        "overallRank": 61,
        "url": "https://benchlm.ai/models/o3",
        "markdownUrl": "https://benchlm.ai/md/models/o3.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 44,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-o3",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-o3",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-o3.md",
      "modelA": {
        "slug": "o3",
        "canonicalModelKey": "o3",
        "model": "o3",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 56,
        "rankingEligible": true,
        "overallRank": 61,
        "url": "https://benchlm.ai/models/o3",
        "markdownUrl": "https://benchlm.ai/md/models/o3.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 44,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-5-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-5-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-5-35b-a3b.md",
      "modelA": {
        "slug": "qwen3-5-35b-a3b",
        "canonicalModelKey": "qwen3-5-35b-a3b",
        "model": "Qwen3.5-35B-A3B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 55,
        "rankingEligible": true,
        "overallRank": 62,
        "url": "https://benchlm.ai/models/qwen3-5-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-35b-a3b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 45,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 33,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 50.6,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 59,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 79.3,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 11
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 91.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 81,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-5-35b-a3b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-5-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-5-35b-a3b.md",
      "modelA": {
        "slug": "qwen3-5-35b-a3b",
        "canonicalModelKey": "qwen3-5-35b-a3b",
        "model": "Qwen3.5-35B-A3B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "262K",
        "contextWindowTokens": 262000,
        "displayScore": 55,
        "rankingEligible": true,
        "overallRank": 62,
        "url": "https://benchlm.ai/models/qwen3-5-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-5-35b-a3b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 45,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 33,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 50.6,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 8
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 58.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": 59,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 79.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 9
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 91.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 81,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-flash-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-3-flash-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-flash-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-3-flash",
        "canonicalModelKey": "gemini-3-flash",
        "model": "Gemini 3 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 55,
        "rankingEligible": true,
        "overallRank": 63,
        "url": "https://benchlm.ai/models/gemini-3-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 45,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-flash-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-3-flash-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-flash-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-3-flash",
        "canonicalModelKey": "gemini-3-flash",
        "model": "Gemini 3 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 55,
        "rankingEligible": true,
        "overallRank": 63,
        "url": "https://benchlm.ai/models/gemini-3-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-flash.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 45,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-o3-mini",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-o3-mini",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-o3-mini.md",
      "modelA": {
        "slug": "o3-mini",
        "canonicalModelKey": "o3-mini",
        "model": "o3-mini",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 55,
        "rankingEligible": true,
        "overallRank": 64,
        "url": "https://benchlm.ai/models/o3-mini",
        "markdownUrl": "https://benchlm.ai/md/models/o3-mini.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 45,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 12,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 49.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 77.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 7
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 93.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-o3-mini",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-o3-mini",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-o3-mini.md",
      "modelA": {
        "slug": "o3-mini",
        "canonicalModelKey": "o3-mini",
        "model": "o3-mini",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 55,
        "rankingEligible": true,
        "overallRank": 64,
        "url": "https://benchlm.ai/models/o3-mini",
        "markdownUrl": "https://benchlm.ai/md/models/o3-mini.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 45,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 12,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 49.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 77.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 93.9,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-minimax-m2-7",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-minimax-m2-7",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-minimax-m2-7.md",
      "modelA": {
        "slug": "minimax-m2-7",
        "canonicalModelKey": "minimax-m2-7",
        "model": "MiniMax M2.7",
        "creator": "MiniMax",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 53,
        "rankingEligible": true,
        "overallRank": 65,
        "url": "https://benchlm.ai/models/minimax-m2-7",
        "markdownUrl": "https://benchlm.ai/md/models/minimax-m2-7.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 47,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 37,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 57,
          "avgB": 90.1,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 53.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 2
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-minimax-m2-7",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-minimax-m2-7",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-minimax-m2-7.md",
      "modelA": {
        "slug": "minimax-m2-7",
        "canonicalModelKey": "minimax-m2-7",
        "model": "MiniMax M2.7",
        "creator": "MiniMax",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 53,
        "rankingEligible": true,
        "overallRank": 65,
        "url": "https://benchlm.ai/models/minimax-m2-7",
        "markdownUrl": "https://benchlm.ai/md/models/minimax-m2-7.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 47,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 37,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": 57,
          "avgB": 82.6,
          "winner": "B",
          "benchmarkCount": 12
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 53.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 12
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-coder-2-0-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-coder-2-0-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-coder-2-0-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-coder-2-0",
        "canonicalModelKey": "deepseek-coder-2-0",
        "model": "DeepSeek Coder 2.0",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 51,
        "rankingEligible": true,
        "overallRank": 66,
        "url": "https://benchlm.ai/models/deepseek-coder-2-0",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-coder-2-0.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 49,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-coder-2-0-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-coder-2-0-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-coder-2-0-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-coder-2-0",
        "canonicalModelKey": "deepseek-coder-2-0",
        "model": "DeepSeek Coder 2.0",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 51,
        "rankingEligible": true,
        "overallRank": 66,
        "url": "https://benchlm.ai/models/deepseek-coder-2-0",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-coder-2-0.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 49,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-4-1-opus-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-4-1-opus-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-1-opus-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-4-1-opus",
        "canonicalModelKey": "claude-4-1-opus",
        "model": "Claude 4.1 Opus",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 51,
        "rankingEligible": true,
        "overallRank": 67,
        "url": "https://benchlm.ai/models/claude-4-1-opus",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-1-opus.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 49,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 3,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 74.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-4-1-opus-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-4-1-opus-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-1-opus-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-4-1-opus",
        "canonicalModelKey": "claude-4-1-opus",
        "model": "Claude 4.1 Opus",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 51,
        "rankingEligible": true,
        "overallRank": 67,
        "url": "https://benchlm.ai/models/claude-4-1-opus",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-1-opus.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 49,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 3,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 74.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-llm-2-0-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-llm-2-0-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-llm-2-0-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-llm-2-0",
        "canonicalModelKey": "deepseek-llm-2-0",
        "model": "DeepSeek LLM 2.0",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 50,
        "rankingEligible": true,
        "overallRank": 68,
        "url": "https://benchlm.ai/models/deepseek-llm-2-0",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-llm-2-0.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 50,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-llm-2-0-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-llm-2-0-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-llm-2-0-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-llm-2-0",
        "canonicalModelKey": "deepseek-llm-2-0",
        "model": "DeepSeek LLM 2.0",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 50,
        "rankingEligible": true,
        "overallRank": 68,
        "url": "https://benchlm.ai/models/deepseek-llm-2-0",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-llm-2-0.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 50,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen2-5-1m",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen2-5-1m",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen2-5-1m.md",
      "modelA": {
        "slug": "qwen2-5-1m",
        "canonicalModelKey": "qwen2-5-1m",
        "model": "Qwen2.5-1M",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 50,
        "rankingEligible": true,
        "overallRank": 69,
        "url": "https://benchlm.ai/models/qwen2-5-1m",
        "markdownUrl": "https://benchlm.ai/md/models/qwen2-5-1m.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 50,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen2-5-1m",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen2-5-1m",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen2-5-1m.md",
      "modelA": {
        "slug": "qwen2-5-1m",
        "canonicalModelKey": "qwen2-5-1m",
        "model": "Qwen2.5-1M",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 50,
        "rankingEligible": true,
        "overallRank": 69,
        "url": "https://benchlm.ai/models/qwen2-5-1m",
        "markdownUrl": "https://benchlm.ai/md/models/qwen2-5-1m.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 50,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-4-sonnet-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-4-sonnet-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-sonnet-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-4-sonnet",
        "canonicalModelKey": "claude-4-sonnet",
        "model": "Claude 4 Sonnet",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 50,
        "rankingEligible": true,
        "overallRank": 70,
        "url": "https://benchlm.ai/models/claude-4-sonnet",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-sonnet.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 50,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 20,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-4-sonnet-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-4-sonnet-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-sonnet-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-4-sonnet",
        "canonicalModelKey": "claude-4-sonnet",
        "model": "Claude 4 Sonnet",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 50,
        "rankingEligible": true,
        "overallRank": 70,
        "url": "https://benchlm.ai/models/claude-4-sonnet",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-sonnet.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 50,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 20,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 6
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 72.7,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-4o-mini-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-4o-mini-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4o-mini-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-4o-mini",
        "canonicalModelKey": "gpt-4o-mini",
        "model": "GPT-4o mini",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 49,
        "rankingEligible": true,
        "overallRank": 71,
        "url": "https://benchlm.ai/models/gpt-4o-mini",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o-mini.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 51,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 6,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-4o-mini-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-4o-mini-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4o-mini-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-4o-mini",
        "canonicalModelKey": "gpt-4o-mini",
        "model": "GPT-4o mini",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 49,
        "rankingEligible": true,
        "overallRank": 71,
        "url": "https://benchlm.ai/models/gpt-4o-mini",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o-mini.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 51,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 6,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen2-5-72b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen2-5-72b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen2-5-72b.md",
      "modelA": {
        "slug": "qwen2-5-72b",
        "canonicalModelKey": "qwen2-5-72b",
        "model": "Qwen2.5-72B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 49,
        "rankingEligible": true,
        "overallRank": 72,
        "url": "https://benchlm.ai/models/qwen2-5-72b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen2-5-72b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 51,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen2-5-72b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen2-5-72b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen2-5-72b.md",
      "modelA": {
        "slug": "qwen2-5-72b",
        "canonicalModelKey": "qwen2-5-72b",
        "model": "Qwen2.5-72B",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 49,
        "rankingEligible": true,
        "overallRank": 72,
        "url": "https://benchlm.ai/models/qwen2-5-72b",
        "markdownUrl": "https://benchlm.ai/md/models/qwen2-5-72b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 51,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseekmath-v2-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseekmath-v2-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseekmath-v2-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseekmath-v2",
        "canonicalModelKey": "deepseekmath-v2",
        "model": "DeepSeekMath V2",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 49,
        "rankingEligible": true,
        "overallRank": 73,
        "url": "https://benchlm.ai/models/deepseekmath-v2",
        "markdownUrl": "https://benchlm.ai/md/models/deepseekmath-v2.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 51,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseekmath-v2-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseekmath-v2-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseekmath-v2-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseekmath-v2",
        "canonicalModelKey": "deepseekmath-v2",
        "model": "DeepSeekMath V2",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 49,
        "rankingEligible": true,
        "overallRank": 73,
        "url": "https://benchlm.ai/models/deepseekmath-v2",
        "markdownUrl": "https://benchlm.ai/md/models/deepseekmath-v2.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 51,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-mistral-large-3",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-mistral-large-3",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-mistral-large-3.md",
      "modelA": {
        "slug": "mistral-large-3",
        "canonicalModelKey": "mistral-large-3",
        "model": "Mistral Large 3",
        "creator": "Mistral",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 48,
        "rankingEligible": true,
        "overallRank": 74,
        "url": "https://benchlm.ai/models/mistral-large-3",
        "markdownUrl": "https://benchlm.ai/md/models/mistral-large-3.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 52,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-mistral-large-3",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-mistral-large-3",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-mistral-large-3.md",
      "modelA": {
        "slug": "mistral-large-3",
        "canonicalModelKey": "mistral-large-3",
        "model": "Mistral Large 3",
        "creator": "Mistral",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 48,
        "rankingEligible": true,
        "overallRank": 74,
        "url": "https://benchlm.ai/models/mistral-large-3",
        "markdownUrl": "https://benchlm.ai/md/models/mistral-large-3.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 52,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-3-1-flash-lite-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-3-1-flash-lite-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-flash-lite-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-3-1-flash-lite",
        "canonicalModelKey": "gemini-3-1-flash-lite",
        "model": "Gemini 3.1 Flash-Lite",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 47,
        "rankingEligible": true,
        "overallRank": 75,
        "url": "https://benchlm.ai/models/gemini-3-1-flash-lite",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-flash-lite.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 53,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 73.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-3-1-flash-lite-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-3-1-flash-lite-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-3-1-flash-lite-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-3-1-flash-lite",
        "canonicalModelKey": "gemini-3-1-flash-lite",
        "model": "Gemini 3.1 Flash-Lite",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 47,
        "rankingEligible": true,
        "overallRank": 75,
        "url": "https://benchlm.ai/models/gemini-3-1-flash-lite",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-3-1-flash-lite.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 53,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": 73.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-235b-2507-reasoning",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-235b-2507-reasoning",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-235b-2507-reasoning.md",
      "modelA": {
        "slug": "qwen3-235b-2507-reasoning",
        "canonicalModelKey": "qwen3-235b-2507-reasoning",
        "model": "Qwen3 235B 2507 (Reasoning)",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 45,
        "rankingEligible": true,
        "overallRank": 76,
        "url": "https://benchlm.ai/models/qwen3-235b-2507-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-235b-2507-reasoning.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 55,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-235b-2507-reasoning",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-235b-2507-reasoning",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-235b-2507-reasoning.md",
      "modelA": {
        "slug": "qwen3-235b-2507-reasoning",
        "canonicalModelKey": "qwen3-235b-2507-reasoning",
        "model": "Qwen3 235B 2507 (Reasoning)",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 45,
        "rankingEligible": true,
        "overallRank": 76,
        "url": "https://benchlm.ai/models/qwen3-235b-2507-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-235b-2507-reasoning.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 55,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-4-1-mini-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-4-1-mini-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-1-mini-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-4-1-mini",
        "canonicalModelKey": "gpt-4-1-mini",
        "model": "GPT-4.1 mini",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 45,
        "rankingEligible": true,
        "overallRank": 77,
        "url": "https://benchlm.ai/models/gpt-4-1-mini",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-1-mini.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 55,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 22,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 23.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 64.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 88.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-4-1-mini-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-4-1-mini-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-1-mini-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-4-1-mini",
        "canonicalModelKey": "gpt-4-1-mini",
        "model": "GPT-4.1 mini",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 45,
        "rankingEligible": true,
        "overallRank": 77,
        "url": "https://benchlm.ai/models/gpt-4-1-mini",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-1-mini.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 55,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 22,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 23.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 64.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 88.5,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-nemotron-3-super-100b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-nemotron-3-super-100b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-nemotron-3-super-100b.md",
      "modelA": {
        "slug": "nemotron-3-super-100b",
        "canonicalModelKey": "nemotron-3-super-100b",
        "model": "Nemotron 3 Super 100B",
        "creator": "NVIDIA",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 43,
        "rankingEligible": true,
        "overallRank": 78,
        "url": "https://benchlm.ai/models/nemotron-3-super-100b",
        "markdownUrl": "https://benchlm.ai/md/models/nemotron-3-super-100b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 57,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 1,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-nemotron-3-super-100b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-nemotron-3-super-100b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-nemotron-3-super-100b.md",
      "modelA": {
        "slug": "nemotron-3-super-100b",
        "canonicalModelKey": "nemotron-3-super-100b",
        "model": "Nemotron 3 Super 100B",
        "creator": "NVIDIA",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 43,
        "rankingEligible": true,
        "overallRank": 78,
        "url": "https://benchlm.ai/models/nemotron-3-super-100b",
        "markdownUrl": "https://benchlm.ai/md/models/nemotron-3-super-100b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 57,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 1,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-o4-mini-high",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-o4-mini-high",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-o4-mini-high.md",
      "modelA": {
        "slug": "o4-mini-high",
        "canonicalModelKey": "o4-mini-high",
        "model": "o4-mini (high)",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 43,
        "rankingEligible": true,
        "overallRank": 79,
        "url": "https://benchlm.ai/models/o4-mini-high",
        "markdownUrl": "https://benchlm.ai/md/models/o4-mini-high.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 57,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-o4-mini-high",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-o4-mini-high",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-o4-mini-high.md",
      "modelA": {
        "slug": "o4-mini-high",
        "canonicalModelKey": "o4-mini-high",
        "model": "o4-mini (high)",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 43,
        "rankingEligible": true,
        "overallRank": 79,
        "url": "https://benchlm.ai/models/o4-mini-high",
        "markdownUrl": "https://benchlm.ai/md/models/o4-mini-high.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 57,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-4-1-opus-thinking-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-4-1-opus-thinking-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-1-opus-thinking-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-4-1-opus-thinking",
        "canonicalModelKey": "claude-4-1-opus-thinking",
        "model": "Claude 4.1 Opus Thinking",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 43,
        "rankingEligible": true,
        "overallRank": 80,
        "url": "https://benchlm.ai/models/claude-4-1-opus-thinking",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-1-opus-thinking.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 57,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 11,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-4-1-opus-thinking-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-4-1-opus-thinking-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-4-1-opus-thinking-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-4-1-opus-thinking",
        "canonicalModelKey": "claude-4-1-opus-thinking",
        "model": "Claude 4.1 Opus Thinking",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 43,
        "rankingEligible": true,
        "overallRank": 80,
        "url": "https://benchlm.ai/models/claude-4-1-opus-thinking",
        "markdownUrl": "https://benchlm.ai/md/models/claude-4-1-opus-thinking.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 57,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 11,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-4o-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-4o-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4o-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-4o",
        "canonicalModelKey": "gpt-4o",
        "model": "GPT-4o",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 42,
        "rankingEligible": true,
        "overallRank": 81,
        "url": "https://benchlm.ai/models/gpt-4o",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 58,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-4o-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-4o-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4o-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-4o",
        "canonicalModelKey": "gpt-4o",
        "model": "GPT-4o",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 42,
        "rankingEligible": true,
        "overallRank": 81,
        "url": "https://benchlm.ai/models/gpt-4o",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4o.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 58,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-kimi-k2",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-kimi-k2",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-kimi-k2.md",
      "modelA": {
        "slug": "kimi-k2",
        "canonicalModelKey": "kimi-k2",
        "model": "Kimi K2",
        "creator": "Moonshot AI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 41,
        "rankingEligible": true,
        "overallRank": 82,
        "url": "https://benchlm.ai/models/kimi-k2",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 59,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-kimi-k2",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-kimi-k2",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-kimi-k2.md",
      "modelA": {
        "slug": "kimi-k2",
        "canonicalModelKey": "kimi-k2",
        "model": "Kimi K2",
        "creator": "Moonshot AI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 41,
        "rankingEligible": true,
        "overallRank": 82,
        "url": "https://benchlm.ai/models/kimi-k2",
        "markdownUrl": "https://benchlm.ai/md/models/kimi-k2.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 59,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-llama-3-1-405b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-llama-3-1-405b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-llama-3-1-405b.md",
      "modelA": {
        "slug": "llama-3-1-405b",
        "canonicalModelKey": "llama-3-1-405b",
        "model": "Llama 3.1 405B",
        "creator": "Meta",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 40,
        "rankingEligible": true,
        "overallRank": 83,
        "url": "https://benchlm.ai/models/llama-3-1-405b",
        "markdownUrl": "https://benchlm.ai/md/models/llama-3-1-405b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 60,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-llama-3-1-405b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-llama-3-1-405b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-llama-3-1-405b.md",
      "modelA": {
        "slug": "llama-3-1-405b",
        "canonicalModelKey": "llama-3-1-405b",
        "model": "Llama 3.1 405B",
        "creator": "Meta",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 40,
        "rankingEligible": true,
        "overallRank": 83,
        "url": "https://benchlm.ai/models/llama-3-1-405b",
        "markdownUrl": "https://benchlm.ai/md/models/llama-3-1-405b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 60,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-3-5-sonnet-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-3-5-sonnet-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-3-5-sonnet-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-3-5-sonnet",
        "canonicalModelKey": "claude-3-5-sonnet",
        "model": "Claude 3.5 Sonnet",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 40,
        "rankingEligible": true,
        "overallRank": 84,
        "url": "https://benchlm.ai/models/claude-3-5-sonnet",
        "markdownUrl": "https://benchlm.ai/md/models/claude-3-5-sonnet.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 60,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 2,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 49,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 59.4,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-3-5-sonnet-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-3-5-sonnet-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-3-5-sonnet-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-3-5-sonnet",
        "canonicalModelKey": "claude-3-5-sonnet",
        "model": "Claude 3.5 Sonnet",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 40,
        "rankingEligible": true,
        "overallRank": 84,
        "url": "https://benchlm.ai/models/claude-3-5-sonnet",
        "markdownUrl": "https://benchlm.ai/md/models/claude-3-5-sonnet.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 60,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 49,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 59.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-grok-code-fast-1",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-grok-code-fast-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-grok-code-fast-1.md",
      "modelA": {
        "slug": "grok-code-fast-1",
        "canonicalModelKey": "grok-code-fast-1",
        "model": "Grok Code Fast 1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 39,
        "rankingEligible": true,
        "overallRank": 85,
        "url": "https://benchlm.ai/models/grok-code-fast-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-code-fast-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 61,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "grok-code-fast-1-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/grok-code-fast-1-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-code-fast-1-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "grok-code-fast-1",
        "canonicalModelKey": "grok-code-fast-1",
        "model": "Grok Code Fast 1",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "256K",
        "contextWindowTokens": 256000,
        "displayScore": 39,
        "rankingEligible": true,
        "overallRank": 85,
        "url": "https://benchlm.ai/models/grok-code-fast-1",
        "markdownUrl": "https://benchlm.ai/md/models/grok-code-fast-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 61,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 70.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-sarvam-105b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-sarvam-105b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-sarvam-105b.md",
      "modelA": {
        "slug": "sarvam-105b",
        "canonicalModelKey": "sarvam-105b",
        "model": "Sarvam 105B",
        "creator": "Sarvam",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 39,
        "rankingEligible": true,
        "overallRank": 86,
        "url": "https://benchlm.ai/models/sarvam-105b",
        "markdownUrl": "https://benchlm.ai/md/models/sarvam-105b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 61,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-sarvam-105b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-sarvam-105b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-sarvam-105b.md",
      "modelA": {
        "slug": "sarvam-105b",
        "canonicalModelKey": "sarvam-105b",
        "model": "Sarvam 105B",
        "creator": "Sarvam",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 39,
        "rankingEligible": true,
        "overallRank": 86,
        "url": "https://benchlm.ai/models/sarvam-105b",
        "markdownUrl": "https://benchlm.ai/md/models/sarvam-105b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 61,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-mistral-large-2",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-mistral-large-2",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-mistral-large-2.md",
      "modelA": {
        "slug": "mistral-large-2",
        "canonicalModelKey": "mistral-large-2",
        "model": "Mistral Large 2",
        "creator": "Mistral",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 38,
        "rankingEligible": true,
        "overallRank": 87,
        "url": "https://benchlm.ai/models/mistral-large-2",
        "markdownUrl": "https://benchlm.ai/md/models/mistral-large-2.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 62,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-mistral-large-2",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-mistral-large-2",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-mistral-large-2.md",
      "modelA": {
        "slug": "mistral-large-2",
        "canonicalModelKey": "mistral-large-2",
        "model": "Mistral Large 2",
        "creator": "Mistral",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 38,
        "rankingEligible": true,
        "overallRank": 87,
        "url": "https://benchlm.ai/models/mistral-large-2",
        "markdownUrl": "https://benchlm.ai/md/models/mistral-large-2.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 62,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-2-5-flash-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-2-5-flash-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-2-5-flash-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-2-5-flash",
        "canonicalModelKey": "gemini-2-5-flash",
        "model": "Gemini 2.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 37,
        "rankingEligible": true,
        "overallRank": 88,
        "url": "https://benchlm.ai/models/gemini-2-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-2-5-flash.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 63,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-2-5-flash-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-2-5-flash-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-2-5-flash-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-2-5-flash",
        "canonicalModelKey": "gemini-2-5-flash",
        "model": "Gemini 2.5 Flash",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 37,
        "rankingEligible": true,
        "overallRank": 88,
        "url": "https://benchlm.ai/models/gemini-2-5-flash",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-2-5-flash.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 63,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-1-5-pro-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-1-5-pro-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-1-5-pro-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-1-5-pro",
        "canonicalModelKey": "gemini-1-5-pro",
        "model": "Gemini 1.5 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 35,
        "rankingEligible": true,
        "overallRank": 89,
        "url": "https://benchlm.ai/models/gemini-1-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-1-5-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 65,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 6,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-1-5-pro-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-1-5-pro-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-1-5-pro-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-1-5-pro",
        "canonicalModelKey": "gemini-1-5-pro",
        "model": "Gemini 1.5 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "2M",
        "contextWindowTokens": 2000000,
        "displayScore": 35,
        "rankingEligible": true,
        "overallRank": 89,
        "url": "https://benchlm.ai/models/gemini-1-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-1-5-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 65,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 6,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v3-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v3-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v3",
        "canonicalModelKey": "deepseek-v3",
        "model": "DeepSeek V3",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 90,
        "url": "https://benchlm.ai/models/deepseek-v3",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 66,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 22,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 39.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 86.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v3-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v3-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v3",
        "canonicalModelKey": "deepseek-v3",
        "model": "DeepSeek V3",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 90,
        "url": "https://benchlm.ai/models/deepseek-v3",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 66,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 22,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": 39.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 5
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 70,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 86.1,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-gpt-oss-120b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-gpt-oss-120b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-gpt-oss-120b.md",
      "modelA": {
        "slug": "gpt-oss-120b",
        "canonicalModelKey": "gpt-oss-120b",
        "model": "GPT-OSS 120B",
        "creator": "OpenAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 91,
        "url": "https://benchlm.ai/models/gpt-oss-120b",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-oss-120b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 66,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 20,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-oss-120b-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-oss-120b-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-oss-120b-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-oss-120b",
        "canonicalModelKey": "gpt-oss-120b",
        "model": "GPT-OSS 120B",
        "creator": "OpenAI",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 91,
        "url": "https://benchlm.ai/models/gpt-oss-120b",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-oss-120b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 66,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 20,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 7
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "claude-3-opus-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/claude-3-opus-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-3-opus-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "claude-3-opus",
        "canonicalModelKey": "claude-3-opus",
        "model": "Claude 3 Opus",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 92,
        "url": "https://benchlm.ai/models/claude-3-opus",
        "markdownUrl": "https://benchlm.ai/md/models/claude-3-opus.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 66,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 5,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "claude-3-opus-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/claude-3-opus-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/claude-3-opus-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "claude-3-opus",
        "canonicalModelKey": "claude-3-opus",
        "model": "Claude 3 Opus",
        "creator": "Anthropic",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 92,
        "url": "https://benchlm.ai/models/claude-3-opus",
        "markdownUrl": "https://benchlm.ai/md/models/claude-3-opus.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 66,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 5,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-minicpm5-1b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-minicpm5-1b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-minicpm5-1b.md",
      "modelA": {
        "slug": "minicpm5-1b",
        "canonicalModelKey": "minicpm5-1b",
        "model": "MiniCPM5-1B",
        "creator": "OpenBMB",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "131K",
        "contextWindowTokens": 131000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 93,
        "url": "https://benchlm.ai/models/minicpm5-1b",
        "markdownUrl": "https://benchlm.ai/md/models/minicpm5-1b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 66,
      "winsA": 1,
      "winsB": 1,
      "comparableCategoryCount": 2,
      "benchmarkCountA": 14,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 39.8,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 68.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 59.6,
          "avgB": 52.4,
          "winner": "A",
          "benchmarkCount": 5
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-minicpm5-1b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-minicpm5-1b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-minicpm5-1b.md",
      "modelA": {
        "slug": "minicpm5-1b",
        "canonicalModelKey": "minicpm5-1b",
        "model": "MiniCPM5-1B",
        "creator": "OpenBMB",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "131K",
        "contextWindowTokens": 131000,
        "displayScore": 34,
        "rankingEligible": true,
        "overallRank": 93,
        "url": "https://benchlm.ai/models/minicpm5-1b",
        "markdownUrl": "https://benchlm.ai/md/models/minicpm5-1b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 66,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 14,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 2
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 39.8,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 68.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": 59.6,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 4
        }
      }
    },
    {
      "slug": "deepseek-r1-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-r1-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-r1-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-r1",
        "canonicalModelKey": "deepseek-r1",
        "model": "DeepSeek-R1",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 32,
        "rankingEligible": true,
        "overallRank": 94,
        "url": "https://benchlm.ai/models/deepseek-r1",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-r1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 68,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-r1-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-r1-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-r1-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-r1",
        "canonicalModelKey": "deepseek-r1",
        "model": "DeepSeek-R1",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 32,
        "rankingEligible": true,
        "overallRank": 94,
        "url": "https://benchlm.ai/models/deepseek-r1",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-r1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 68,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-qwen3-235b-2507",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-qwen3-235b-2507",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-qwen3-235b-2507.md",
      "modelA": {
        "slug": "qwen3-235b-2507",
        "canonicalModelKey": "qwen3-235b-2507",
        "model": "Qwen3 235B 2507",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 32,
        "rankingEligible": true,
        "overallRank": 95,
        "url": "https://benchlm.ai/models/qwen3-235b-2507",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-235b-2507.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 68,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 4,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 79.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-qwen3-235b-2507",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-qwen3-235b-2507",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-qwen3-235b-2507.md",
      "modelA": {
        "slug": "qwen3-235b-2507",
        "canonicalModelKey": "qwen3-235b-2507",
        "model": "Qwen3 235B 2507",
        "creator": "Alibaba",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 32,
        "rankingEligible": true,
        "overallRank": 95,
        "url": "https://benchlm.ai/models/qwen3-235b-2507",
        "markdownUrl": "https://benchlm.ai/md/models/qwen3-235b-2507.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 68,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 76.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": 79.4,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "dbrx-instruct-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/dbrx-instruct-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/dbrx-instruct-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "dbrx-instruct",
        "canonicalModelKey": "dbrx-instruct",
        "model": "DBRX Instruct",
        "creator": "Databricks",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 32,
        "rankingEligible": true,
        "overallRank": 96,
        "url": "https://benchlm.ai/models/dbrx-instruct",
        "markdownUrl": "https://benchlm.ai/md/models/dbrx-instruct.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 68,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "dbrx-instruct-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/dbrx-instruct-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/dbrx-instruct-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "dbrx-instruct",
        "canonicalModelKey": "dbrx-instruct",
        "model": "DBRX Instruct",
        "creator": "Databricks",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 32,
        "rankingEligible": true,
        "overallRank": 96,
        "url": "https://benchlm.ai/models/dbrx-instruct",
        "markdownUrl": "https://benchlm.ai/md/models/dbrx-instruct.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 68,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-grok-3-beta",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-grok-3-beta",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-grok-3-beta.md",
      "modelA": {
        "slug": "grok-3-beta",
        "canonicalModelKey": "grok-3-beta",
        "model": "Grok 3 [Beta]",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 30,
        "rankingEligible": true,
        "overallRank": 97,
        "url": "https://benchlm.ai/models/grok-3-beta",
        "markdownUrl": "https://benchlm.ai/md/models/grok-3-beta.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 70,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "grok-3-beta-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/grok-3-beta-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/grok-3-beta-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "grok-3-beta",
        "canonicalModelKey": "grok-3-beta",
        "model": "Grok 3 [Beta]",
        "creator": "xAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 30,
        "rankingEligible": true,
        "overallRank": 97,
        "url": "https://benchlm.ai/models/grok-3-beta",
        "markdownUrl": "https://benchlm.ai/md/models/grok-3-beta.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 70,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v3-1-reasoning-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v3-1-reasoning-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-1-reasoning-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v3-1-reasoning",
        "canonicalModelKey": "deepseek-v3-1-reasoning",
        "model": "DeepSeek V3.1 (Reasoning)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 29,
        "rankingEligible": true,
        "overallRank": 98,
        "url": "https://benchlm.ai/models/deepseek-v3-1-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-1-reasoning.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 71,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v3-1-reasoning-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v3-1-reasoning-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-1-reasoning-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v3-1-reasoning",
        "canonicalModelKey": "deepseek-v3-1-reasoning",
        "model": "DeepSeek V3.1 (Reasoning)",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 29,
        "rankingEligible": true,
        "overallRank": 98,
        "url": "https://benchlm.ai/models/deepseek-v3-1-reasoning",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-1-reasoning.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 71,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-o1-pro",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-o1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-o1-pro.md",
      "modelA": {
        "slug": "o1-pro",
        "canonicalModelKey": "o1-pro",
        "model": "o1-pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 28,
        "rankingEligible": true,
        "overallRank": 99,
        "url": "https://benchlm.ai/models/o1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/o1-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 72,
      "winsA": 1,
      "winsB": 0,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 2,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 79,
          "avgB": 57.2,
          "winner": "A",
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-o1-pro",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-o1-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-o1-pro.md",
      "modelA": {
        "slug": "o1-pro",
        "canonicalModelKey": "o1-pro",
        "model": "o1-pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "200K",
        "contextWindowTokens": 200000,
        "displayScore": 28,
        "rankingEligible": true,
        "overallRank": 99,
        "url": "https://benchlm.ai/models/o1-pro",
        "markdownUrl": "https://benchlm.ai/md/models/o1-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 72,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 2,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 79,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-phi-4",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-phi-4",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-phi-4.md",
      "modelA": {
        "slug": "phi-4",
        "canonicalModelKey": "phi-4",
        "model": "Phi-4",
        "creator": "Microsoft",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "16K",
        "contextWindowTokens": 16000,
        "displayScore": 27,
        "rankingEligible": true,
        "overallRank": 100,
        "url": "https://benchlm.ai/models/phi-4",
        "markdownUrl": "https://benchlm.ai/md/models/phi-4.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 73,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 14,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 3
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-phi-4",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-phi-4",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-phi-4.md",
      "modelA": {
        "slug": "phi-4",
        "canonicalModelKey": "phi-4",
        "model": "Phi-4",
        "creator": "Microsoft",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "16K",
        "contextWindowTokens": 16000,
        "displayScore": 27,
        "rankingEligible": true,
        "overallRank": 100,
        "url": "https://benchlm.ai/models/phi-4",
        "markdownUrl": "https://benchlm.ai/md/models/phi-4.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 73,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 14,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 3
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-4-1-nano-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-4-1-nano-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-1-nano-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-4-1-nano",
        "canonicalModelKey": "gpt-4-1-nano",
        "model": "GPT-4.1 nano",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 27,
        "rankingEligible": true,
        "overallRank": 101,
        "url": "https://benchlm.ai/models/gpt-4-1-nano",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-1-nano.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 73,
      "winsA": 0,
      "winsB": 1,
      "comparableCategoryCount": 1,
      "benchmarkCountA": 21,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 50.3,
          "avgB": 57.2,
          "winner": "B",
          "benchmarkCount": 10
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 83.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-4-1-nano-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-4-1-nano-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-1-nano-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-4-1-nano",
        "canonicalModelKey": "gpt-4-1-nano",
        "model": "GPT-4.1 nano",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 27,
        "rankingEligible": true,
        "overallRank": 101,
        "url": "https://benchlm.ai/models/gpt-4-1-nano",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-1-nano.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 73,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 21,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": 50.3,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": 83.2,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "glm-4-5-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/glm-4-5-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-4-5-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "glm-4-5",
        "canonicalModelKey": "glm-4-5",
        "model": "GLM-4.5",
        "creator": "Z.AI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 102,
        "url": "https://benchlm.ai/models/glm-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/glm-4-5.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 1,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "glm-4-5-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/glm-4-5-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/glm-4-5-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "glm-4-5",
        "canonicalModelKey": "glm-4-5",
        "model": "GLM-4.5",
        "creator": "Z.AI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 102,
        "url": "https://benchlm.ai/models/glm-4-5",
        "markdownUrl": "https://benchlm.ai/md/models/glm-4-5.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 1,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-llama-4-scout",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-llama-4-scout",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-llama-4-scout.md",
      "modelA": {
        "slug": "llama-4-scout",
        "canonicalModelKey": "llama-4-scout",
        "model": "Llama 4 Scout",
        "creator": "Meta",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "10M",
        "contextWindowTokens": 10000000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 103,
        "url": "https://benchlm.ai/models/llama-4-scout",
        "markdownUrl": "https://benchlm.ai/md/models/llama-4-scout.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-llama-4-scout",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-llama-4-scout",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-llama-4-scout.md",
      "modelA": {
        "slug": "llama-4-scout",
        "canonicalModelKey": "llama-4-scout",
        "model": "Llama 4 Scout",
        "creator": "Meta",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "10M",
        "contextWindowTokens": 10000000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 103,
        "url": "https://benchlm.ai/models/llama-4-scout",
        "markdownUrl": "https://benchlm.ai/md/models/llama-4-scout.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 18,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-nemotron-3-nano-30b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-nemotron-3-nano-30b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-nemotron-3-nano-30b.md",
      "modelA": {
        "slug": "nemotron-3-nano-30b",
        "canonicalModelKey": "nemotron-3-nano-30b",
        "model": "Nemotron 3 Nano 30B",
        "creator": "NVIDIA",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 104,
        "url": "https://benchlm.ai/models/nemotron-3-nano-30b",
        "markdownUrl": "https://benchlm.ai/md/models/nemotron-3-nano-30b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-nemotron-3-nano-30b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-nemotron-3-nano-30b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-nemotron-3-nano-30b.md",
      "modelA": {
        "slug": "nemotron-3-nano-30b",
        "canonicalModelKey": "nemotron-3-nano-30b",
        "model": "Nemotron 3 Nano 30B",
        "creator": "NVIDIA",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 104,
        "url": "https://benchlm.ai/models/nemotron-3-nano-30b",
        "markdownUrl": "https://benchlm.ai/md/models/nemotron-3-nano-30b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 16,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-llama-3-70b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-llama-3-70b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-llama-3-70b.md",
      "modelA": {
        "slug": "llama-3-70b",
        "canonicalModelKey": "llama-3-70b",
        "model": "Llama 3 70B",
        "creator": "Meta",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 105,
        "url": "https://benchlm.ai/models/llama-3-70b",
        "markdownUrl": "https://benchlm.ai/md/models/llama-3-70b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-llama-3-70b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-llama-3-70b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-llama-3-70b.md",
      "modelA": {
        "slug": "llama-3-70b",
        "canonicalModelKey": "llama-3-70b",
        "model": "Llama 3 70B",
        "creator": "Meta",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 25,
        "rankingEligible": true,
        "overallRank": 105,
        "url": "https://benchlm.ai/models/llama-3-70b",
        "markdownUrl": "https://benchlm.ai/md/models/llama-3-70b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 75,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "deepseek-v3-1-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/deepseek-v3-1-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-1-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "deepseek-v3-1",
        "canonicalModelKey": "deepseek-v3-1",
        "model": "DeepSeek V3.1",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 24,
        "rankingEligible": true,
        "overallRank": 106,
        "url": "https://benchlm.ai/models/deepseek-v3-1",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 76,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 8
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "deepseek-v3-1-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/deepseek-v3-1-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/deepseek-v3-1-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "deepseek-v3-1",
        "canonicalModelKey": "deepseek-v3-1",
        "model": "DeepSeek V3.1",
        "creator": "DeepSeek",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 24,
        "rankingEligible": true,
        "overallRank": 106,
        "url": "https://benchlm.ai/models/deepseek-v3-1",
        "markdownUrl": "https://benchlm.ai/md/models/deepseek-v3-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 76,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 17,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 5
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 6
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-4-turbo-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gpt-4-turbo-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-turbo-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gpt-4-turbo",
        "canonicalModelKey": "gpt-4-turbo",
        "model": "GPT-4 Turbo",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 24,
        "rankingEligible": true,
        "overallRank": 107,
        "url": "https://benchlm.ai/models/gpt-4-turbo",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-turbo.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 76,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 4
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gpt-4-turbo-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gpt-4-turbo-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-4-turbo-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gpt-4-turbo",
        "canonicalModelKey": "gpt-4-turbo",
        "model": "GPT-4 Turbo",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 24,
        "rankingEligible": true,
        "overallRank": 107,
        "url": "https://benchlm.ai/models/gpt-4-turbo",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-4-turbo.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 76,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gemini-1-0-pro-vs-gpt-5-5-pro",
      "url": "https://benchlm.ai/compare/gemini-1-0-pro-vs-gpt-5-5-pro",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-1-0-pro-vs-gpt-5-5-pro.md",
      "modelA": {
        "slug": "gemini-1-0-pro",
        "canonicalModelKey": "gemini-1-0-pro",
        "model": "Gemini 1.0 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 24,
        "rankingEligible": true,
        "overallRank": 108,
        "url": "https://benchlm.ai/models/gemini-1-0-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-1-0-pro.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 76,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 5
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "gemini-1-0-pro-vs-holo3-35b-a3b",
      "url": "https://benchlm.ai/compare/gemini-1-0-pro-vs-holo3-35b-a3b",
      "markdownUrl": "https://benchlm.ai/md/compare/gemini-1-0-pro-vs-holo3-35b-a3b.md",
      "modelA": {
        "slug": "gemini-1-0-pro",
        "canonicalModelKey": "gemini-1-0-pro",
        "model": "Gemini 1.0 Pro",
        "creator": "Google",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 24,
        "rankingEligible": true,
        "overallRank": 108,
        "url": "https://benchlm.ai/models/gemini-1-0-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gemini-1-0-pro.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 76,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 4,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 1
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 3
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-z-1",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-z-1",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-z-1.md",
      "modelA": {
        "slug": "z-1",
        "canonicalModelKey": "z-1",
        "model": "Z-1",
        "creator": "Z",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 23,
        "rankingEligible": true,
        "overallRank": 109,
        "url": "https://benchlm.ai/models/z-1",
        "markdownUrl": "https://benchlm.ai/md/models/z-1.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 77,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-z-1",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-z-1",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-z-1.md",
      "modelA": {
        "slug": "z-1",
        "canonicalModelKey": "z-1",
        "model": "Z-1",
        "creator": "Z",
        "sourceType": "Proprietary",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "128K",
        "contextWindowTokens": 128000,
        "displayScore": 23,
        "rankingEligible": true,
        "overallRank": 109,
        "url": "https://benchlm.ai/models/z-1",
        "markdownUrl": "https://benchlm.ai/md/models/z-1.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 77,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    },
    {
      "slug": "gpt-5-5-pro-vs-mistral-8x7b",
      "url": "https://benchlm.ai/compare/gpt-5-5-pro-vs-mistral-8x7b",
      "markdownUrl": "https://benchlm.ai/md/compare/gpt-5-5-pro-vs-mistral-8x7b.md",
      "modelA": {
        "slug": "mistral-8x7b",
        "canonicalModelKey": "mistral-8x7b",
        "model": "Mistral 8x7B",
        "creator": "Mistral",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 23,
        "rankingEligible": true,
        "overallRank": 110,
        "url": "https://benchlm.ai/models/mistral-8x7b",
        "markdownUrl": "https://benchlm.ai/md/models/mistral-8x7b.md"
      },
      "modelB": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "gpt-5-5-pro",
        "canonicalModelKey": "gpt-5-5-pro",
        "model": "GPT-5.5 Pro",
        "creator": "OpenAI",
        "sourceType": "Proprietary",
        "reasoningType": "Reasoning",
        "contextWindow": "1M",
        "contextWindowTokens": 1000000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/gpt-5-5-pro",
        "markdownUrl": "https://benchlm.ai/md/models/gpt-5-5-pro.md"
      },
      "scoreDiff": 77,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 4,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 90.1,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": 57.2,
          "winner": null,
          "benchmarkCount": 2
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": 52.4,
          "winner": null,
          "benchmarkCount": 1
        }
      }
    },
    {
      "slug": "holo3-35b-a3b-vs-mistral-8x7b",
      "url": "https://benchlm.ai/compare/holo3-35b-a3b-vs-mistral-8x7b",
      "markdownUrl": "https://benchlm.ai/md/compare/holo3-35b-a3b-vs-mistral-8x7b.md",
      "modelA": {
        "slug": "mistral-8x7b",
        "canonicalModelKey": "mistral-8x7b",
        "model": "Mistral 8x7B",
        "creator": "Mistral",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "32K",
        "contextWindowTokens": 32000,
        "displayScore": 23,
        "rankingEligible": true,
        "overallRank": 110,
        "url": "https://benchlm.ai/models/mistral-8x7b",
        "markdownUrl": "https://benchlm.ai/md/models/mistral-8x7b.md"
      },
      "modelB": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "overallWinner": "B",
      "winner": {
        "slug": "holo3-35b-a3b",
        "canonicalModelKey": "holo3-35b-a3b",
        "model": "Holo3-35B-A3B",
        "creator": "H Company",
        "sourceType": "Open Weight",
        "reasoningType": "Non-Reasoning",
        "contextWindow": "64K",
        "contextWindowTokens": 64000,
        "displayScore": 100,
        "rankingEligible": false,
        "overallRank": null,
        "url": "https://benchlm.ai/models/holo3-35b-a3b",
        "markdownUrl": "https://benchlm.ai/md/models/holo3-35b-a3b.md"
      },
      "scoreDiff": 77,
      "winsA": 0,
      "winsB": 0,
      "comparableCategoryCount": 0,
      "benchmarkCountA": 0,
      "benchmarkCountB": 1,
      "categoryResults": {
        "agentic": {
          "categoryLabel": "Agentic",
          "avgA": null,
          "avgB": 82.6,
          "winner": null,
          "benchmarkCount": 1
        },
        "coding": {
          "categoryLabel": "Coding",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multimodalGrounded": {
          "categoryLabel": "Multimodal & Grounded",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "reasoning": {
          "categoryLabel": "Reasoning",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "knowledge": {
          "categoryLabel": "Knowledge",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "instructionFollowing": {
          "categoryLabel": "Instruction Following",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "multilingual": {
          "categoryLabel": "Multilingual",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        },
        "math": {
          "categoryLabel": "Mathematics",
          "avgA": null,
          "avgB": null,
          "winner": null,
          "benchmarkCount": 0
        }
      }
    }
  ]
}
