{
  "updatedAt": "2026-07-30T03:17:49.398Z",
  "source": "openrouter-models-api",
  "rankingVersion": "2026-07-30.v1",
  "probeMode": "active",
  "refreshMode": "fullEval",
  "liteEvalMode": "active",
  "liteEvalSuite": "lite-agent-eval-v1",
  "rankingConfidence": "high",
  "rankingConfidenceReason": "No unevaluated candidate can overtake the primary even with a perfect lite eval score.",
  "evalCoverage": {
    "evaluated": 4,
    "completedToday": 2,
    "attemptedToday": 2,
    "totalRanked": 16,
    "candidatePool": 16,
    "unevaluatedCanStillWin": false,
    "unevaluatedThreatCount": 0,
    "topUnevaluatedThreat": null,
    "maxUnevaluatedPossibleScore": null
  },
  "baseUrl": "https://openrouter.ai/api/v1",
  "createKeyUrl": "https://openrouter.ai/settings/keys",
  "fallback": {
    "id": "openrouter/free",
    "reason": "OpenRouter-managed free model router"
  },
  "count": 6,
  "models": [
    {
      "rank": 1,
      "id": "google/gemma-4-26b-a4b-it:free",
      "name": "Google: Gemma 4 26B A4B (free)",
      "score": 1590,
      "metadataScore": 540,
      "healthScore": 400,
      "latencyScore": 20,
      "liteEvalScore": 630,
      "contextLength": 131072,
      "maxCompletionTokens": 32768,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": true,
      "supportsResponseFormat": true,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": true,
      "latencyMs": 6573,
      "healthStatus": "passed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "completed",
        "passed": 2,
        "total": 3,
        "updatedAt": "2026-07-30T03:17:49.398Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 350,
            "maxPoints": 350,
            "score": 1,
            "status": "passed",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": true,
              "readmeHasTitle": true,
              "gitignoreCreated": true,
              "gitignoreHasPycache": true,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 250,
            "maxPoints": 300,
            "score": 0.833,
            "status": "passed",
            "details": {
              "command": "grep -l \"FATAL:\" *.log",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": false,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": true,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 30,
            "maxPoints": 100,
            "score": 0.3,
            "status": "partial",
            "details": {
              "expected": "02:12:48",
              "received": "01:11:11"
            }
          }
        ]
      },
      "reason": "Tools, structured outputs, reasoning; lite eval 2/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 2,
      "id": "nvidia/nemotron-3-super-120b-a12b:free",
      "name": "NVIDIA: Nemotron 3 Super (free)",
      "score": 1390,
      "metadataScore": 570,
      "healthScore": 250,
      "latencyScore": 75,
      "liteEvalScore": 495,
      "contextLength": 262144,
      "maxCompletionTokens": 262144,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": true,
      "supportsResponseFormat": true,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": false,
      "latencyMs": 457,
      "healthStatus": "imperfect",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "completed",
        "passed": 1,
        "total": 3,
        "updatedAt": "2026-07-30T03:17:49.398Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 220,
            "maxPoints": 350,
            "score": 0.629,
            "status": "partial",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": false,
              "readmeHasTitle": false,
              "gitignoreCreated": false,
              "gitignoreHasPycache": false,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 275,
            "maxPoints": 300,
            "score": 0.917,
            "status": "passed",
            "details": {
              "command": "grep -rl \"FATAL:\" . --include=\"*.log\"",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": false,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 0,
            "maxPoints": 100,
            "score": 0,
            "status": "failed",
            "details": {
              "expected": "02:12:48",
              "received": "We need to decode only the time after the em dash. Input: \"𒌚𒁹𒁹𒁹𒁹 𒌓𒌋𒌋𒁹𒁹"
            }
          }
        ]
      },
      "reason": "Tools, structured outputs, reasoning; lite eval 1/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 3,
      "id": "inclusionai/ling-3.0-flash:free",
      "name": "Ling-3.0-flash (free)",
      "score": 1155,
      "metadataScore": 530,
      "healthScore": 100,
      "latencyScore": 25,
      "liteEvalScore": 500,
      "contextLength": 262144,
      "maxCompletionTokens": 32768,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": false,
      "supportsResponseFormat": false,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": true,
      "latencyMs": null,
      "healthStatus": "not_probed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "cached_recent",
        "passed": 2,
        "total": 3,
        "updatedAt": "2026-07-28T03:17:03.642Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 350,
            "maxPoints": 350,
            "score": 1,
            "status": "passed",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": true,
              "readmeHasTitle": true,
              "gitignoreCreated": true,
              "gitignoreHasPycache": true,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 275,
            "maxPoints": 300,
            "score": 0.917,
            "status": "passed",
            "details": {
              "command": "grep -rl \"FATAL:\" --include=\"*.log\" .",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": false,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 0,
            "maxPoints": 100,
            "score": 0,
            "status": "failed",
            "details": {
              "expected": "02:12:48",
              "received": ""
            }
          }
        ],
        "cachedFromUpdatedAt": "2026-07-28T03:17:03.642Z",
        "cacheAgeDays": 2,
        "cacheMultiplier": 0.8
      },
      "reason": "Tools, reasoning, 262k context; lite eval 2/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 4,
      "id": "openai/gpt-oss-20b:free",
      "name": "OpenAI: gpt-oss-20b (free)",
      "score": 1071,
      "metadataScore": 530,
      "healthScore": 100,
      "latencyScore": 25,
      "liteEvalScore": 416,
      "contextLength": 131072,
      "maxCompletionTokens": 32768,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": true,
      "supportsResponseFormat": true,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": true,
      "latencyMs": null,
      "healthStatus": "not_probed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "cached_recent",
        "passed": 1,
        "total": 3,
        "updatedAt": "2026-07-28T03:17:03.642Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 220,
            "maxPoints": 350,
            "score": 0.629,
            "status": "partial",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": false,
              "readmeHasTitle": false,
              "gitignoreCreated": false,
              "gitignoreHasPycache": false,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 300,
            "maxPoints": 300,
            "score": 1,
            "status": "passed",
            "details": {
              "command": "find . -type f -name '*.log' -exec grep -l 'FATAL:' {} +",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": true,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 0,
            "maxPoints": 100,
            "score": 0,
            "status": "failed",
            "details": {
              "expected": "02:12:48",
              "received": ""
            }
          }
        ],
        "cachedFromUpdatedAt": "2026-07-28T03:17:03.642Z",
        "cacheAgeDays": 2,
        "cacheMultiplier": 0.8
      },
      "reason": "Tools, structured outputs, reasoning; lite eval 1/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 5,
      "id": "google/gemma-4-31b-it:free",
      "name": "Google: Gemma 4 31B (free)",
      "score": 650,
      "metadataScore": 530,
      "healthScore": 100,
      "latencyScore": 20,
      "liteEvalScore": 0,
      "contextLength": 262144,
      "maxCompletionTokens": 32768,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": false,
      "supportsResponseFormat": true,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": false,
      "latencyMs": 4473,
      "healthStatus": "http_429",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "not_evaluated",
        "passed": 0,
        "total": 0,
        "updatedAt": null,
        "tasks": []
      },
      "reason": "Tools, reasoning, 262k context",
      "instabilityPenalty": 0
    },
    {
      "rank": 6,
      "id": "cohere/north-mini-code:free",
      "name": "Cohere: North Mini Code (free)",
      "score": 639,
      "metadataScore": 514,
      "healthScore": 100,
      "latencyScore": 25,
      "liteEvalScore": 0,
      "contextLength": 256000,
      "maxCompletionTokens": 64000,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": false,
      "supportsResponseFormat": false,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": true,
      "latencyMs": null,
      "healthStatus": "not_probed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "not_evaluated",
        "passed": 0,
        "total": 0,
        "updatedAt": null,
        "tasks": []
      },
      "reason": "Tools, reasoning, 256k context",
      "instabilityPenalty": 0
    }
  ],
  "notes": [
    "Free model availability and rate limits can vary.",
    "Top candidates also received a lite agent eval for small file-writing, shell-command, and symbolic-decoding tasks.",
    "The lite eval is a practical heuristic, not an official PinchBench result.",
    "Use openrouter/free if the recommended model is temporarily unavailable."
  ]
}