{
  "updatedAt": "2026-05-18T03:17:53.422Z",
  "source": "openrouter-models-api",
  "rankingVersion": "2026-05-18.v1",
  "probeMode": "active",
  "refreshMode": "fullEval",
  "liteEvalMode": "active",
  "liteEvalSuite": "lite-agent-eval-v1",
  "rankingConfidence": "high",
  "rankingConfidenceReason": "No unevaluated candidate can overtake the primary even with a perfect lite eval score.",
  "evalCoverage": {
    "evaluated": 8,
    "completedToday": 2,
    "attemptedToday": 4,
    "totalRanked": 20,
    "candidatePool": 20,
    "unevaluatedCanStillWin": false,
    "unevaluatedThreatCount": 0,
    "topUnevaluatedThreat": null,
    "maxUnevaluatedPossibleScore": null
  },
  "baseUrl": "https://openrouter.ai/api/v1",
  "createKeyUrl": "https://openrouter.ai/settings/keys",
  "fallback": {
    "id": "openrouter/free",
    "reason": "OpenRouter-managed free model router"
  },
  "count": 6,
  "models": [
    {
      "rank": 1,
      "id": "nvidia/nemotron-3-super-120b-a12b:free",
      "name": "NVIDIA: Nemotron 3 Super (free)",
      "score": 1375,
      "metadataScore": 585,
      "healthScore": 250,
      "latencyScore": 20,
      "liteEvalScore": 520,
      "contextLength": 262144,
      "maxCompletionTokens": 262144,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": true,
      "supportsResponseFormat": true,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": false,
      "latencyMs": 4576,
      "healthStatus": "imperfect",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "completed",
        "passed": 1,
        "total": 3,
        "updatedAt": "2026-05-18T03:17:53.422Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 220,
            "maxPoints": 350,
            "score": 0.629,
            "status": "partial",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": false,
              "readmeHasTitle": false,
              "gitignoreCreated": false,
              "gitignoreHasPycache": false,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 300,
            "maxPoints": 300,
            "score": 1,
            "status": "passed",
            "details": {
              "command": "grep -r -l 'FATAL:' --include='*.log' .",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": true,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 0,
            "maxPoints": 100,
            "score": 0,
            "status": "failed",
            "details": {
              "expected": "02:12:48",
              "received": "{\". Wait need to parse. The input string:  \":\". Let's copy exactly:  \"}"
            }
          }
        ]
      },
      "reason": "Tools, structured outputs, reasoning; lite eval 1/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 2,
      "id": "openrouter/owl-alpha",
      "name": "Owl Alpha",
      "score": 1157,
      "metadataScore": 545,
      "healthScore": 0,
      "latencyScore": 0,
      "liteEvalScore": 612,
      "contextLength": 1048756,
      "maxCompletionTokens": 262144,
      "supportsTools": true,
      "supportsToolChoice": false,
      "supportsStructuredOutputs": true,
      "supportsResponseFormat": true,
      "supportsReasoning": false,
      "supportsIncludeReasoning": false,
      "supportsSeed": true,
      "supportsStop": true,
      "latencyMs": null,
      "healthStatus": "timeout_or_error",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "cached_recent",
        "passed": 2,
        "total": 3,
        "updatedAt": "2026-05-17T03:17:45.603Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 350,
            "maxPoints": 350,
            "score": 1,
            "status": "passed",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": true,
              "readmeHasTitle": true,
              "gitignoreCreated": true,
              "gitignoreHasPycache": true,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 300,
            "maxPoints": 300,
            "score": 1,
            "status": "passed",
            "details": {
              "command": "find . -name \"*.log\" -exec grep -l \"FATAL:\" {} + | sort -u",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": true,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 30,
            "maxPoints": 100,
            "score": 0.3,
            "status": "partial",
            "details": {
              "expected": "02:12:48",
              "received": "02:13:08"
            }
          }
        ],
        "cachedFromUpdatedAt": "2026-05-17T03:17:45.603Z",
        "cacheAgeDays": 1,
        "cacheMultiplier": 0.9
      },
      "reason": "Tools, structured outputs, 262k+ context; lite eval 2/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 3,
      "id": "deepseek/deepseek-v4-flash:free",
      "name": "DeepSeek: DeepSeek V4 Flash (free)",
      "score": 1050,
      "metadataScore": 490,
      "healthScore": 100,
      "latencyScore": 25,
      "liteEvalScore": 435,
      "contextLength": 1048576,
      "maxCompletionTokens": 384000,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": false,
      "supportsResponseFormat": false,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": false,
      "supportsStop": false,
      "latencyMs": null,
      "healthStatus": "not_probed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "cached_recent",
        "passed": 3,
        "total": 3,
        "updatedAt": "2026-05-14T03:17:11.508Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 350,
            "maxPoints": 350,
            "score": 1,
            "status": "passed",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": true,
              "readmeHasTitle": true,
              "gitignoreCreated": true,
              "gitignoreHasPycache": true,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 275,
            "maxPoints": 300,
            "score": 0.917,
            "status": "passed",
            "details": {
              "command": "grep -rl --include='*.log' 'FATAL:' .",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": false,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 100,
            "maxPoints": 100,
            "score": 1,
            "status": "passed",
            "details": {
              "expected": "02:12:48",
              "received": "02:12:48"
            }
          }
        ],
        "cachedFromUpdatedAt": "2026-05-14T03:17:11.508Z",
        "cacheAgeDays": 4,
        "cacheMultiplier": 0.6
      },
      "reason": "Tools, reasoning, 262k+ context; lite eval 3/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 4,
      "id": "arcee-ai/trinity-large-thinking:free",
      "name": "Arcee AI: Trinity Large Thinking (free)",
      "score": 975,
      "metadataScore": 475,
      "healthScore": 100,
      "latencyScore": 25,
      "liteEvalScore": 375,
      "contextLength": 262144,
      "maxCompletionTokens": 80000,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": false,
      "supportsResponseFormat": false,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": false,
      "supportsStop": false,
      "latencyMs": null,
      "healthStatus": "not_probed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "cached_recent",
        "passed": 2,
        "total": 3,
        "updatedAt": "2026-05-14T03:17:11.508Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 350,
            "maxPoints": 350,
            "score": 1,
            "status": "passed",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": true,
              "readmeHasTitle": true,
              "gitignoreCreated": true,
              "gitignoreHasPycache": true,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 275,
            "maxPoints": 300,
            "score": 0.917,
            "status": "passed",
            "details": {
              "command": "grep -rl \"FATAL:\" . --include=\"*.log\"",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": false,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 0,
            "maxPoints": 100,
            "score": 0,
            "status": "failed",
            "details": {
              "expected": "02:12:48",
              "received": ""
            }
          }
        ],
        "cachedFromUpdatedAt": "2026-05-14T03:17:11.508Z",
        "cacheAgeDays": 4,
        "cacheMultiplier": 0.6
      },
      "reason": "Tools, reasoning, 262k context; lite eval 2/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 5,
      "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free",
      "name": "NVIDIA: Nemotron 3 Nano Omni (free)",
      "score": 934,
      "metadataScore": 509,
      "healthScore": 100,
      "latencyScore": 25,
      "liteEvalScore": 300,
      "contextLength": 256000,
      "maxCompletionTokens": 65536,
      "supportsTools": true,
      "supportsToolChoice": true,
      "supportsStructuredOutputs": false,
      "supportsResponseFormat": false,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": false,
      "latencyMs": null,
      "healthStatus": "not_probed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "completed",
        "passed": 1,
        "total": 3,
        "updatedAt": "2026-05-18T03:17:53.422Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 0,
            "maxPoints": 350,
            "score": 0,
            "status": "failed",
            "details": {
              "usedTool": false,
              "mainPyCreated": false,
              "helloPython": false,
              "readmeCreated": false,
              "readmeHasTitle": false,
              "gitignoreCreated": false,
              "gitignoreHasPycache": false,
              "noUnsafePaths": false
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 300,
            "maxPoints": 300,
            "score": 1,
            "status": "passed",
            "details": {
              "command": "find . -name \"*.log\" -exec grep -l \"FATAL:\" {} \\;",
              "wroteCommandFile": true,
              "shellOnly": true,
              "recursiveSearch": true,
              "restrictsToLogFiles": true,
              "matchesFatalExactly": true,
              "printsEachFileOnce": true,
              "plausiblyExecutable": true
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 0,
            "maxPoints": 100,
            "score": 0,
            "status": "failed",
            "details": {
              "expected": "02:12:48",
              "received": ""
            }
          }
        ]
      },
      "reason": "Tools, reasoning, 128k+ context; lite eval 1/3",
      "instabilityPenalty": 0
    },
    {
      "rank": 6,
      "id": "minimax/minimax-m2.5:free",
      "name": "MiniMax: MiniMax M2.5 (free)",
      "score": 833,
      "metadataScore": 498,
      "healthScore": 100,
      "latencyScore": 25,
      "liteEvalScore": 210,
      "contextLength": 196608,
      "maxCompletionTokens": 8192,
      "supportsTools": true,
      "supportsToolChoice": false,
      "supportsStructuredOutputs": false,
      "supportsResponseFormat": true,
      "supportsReasoning": true,
      "supportsIncludeReasoning": true,
      "supportsSeed": true,
      "supportsStop": true,
      "latencyMs": null,
      "healthStatus": "not_probed",
      "evalSuite": "lite-agent-eval-v1",
      "evalSummary": {
        "suite": "lite-agent-eval-v1",
        "status": "cached_recent",
        "passed": 1,
        "total": 3,
        "updatedAt": "2026-05-14T03:17:11.508Z",
        "tasks": [
          {
            "id": "task_files_lite",
            "source": "pinchbench/task_files",
            "points": 350,
            "maxPoints": 350,
            "score": 1,
            "status": "passed",
            "details": {
              "usedTool": true,
              "mainPyCreated": true,
              "helloPython": true,
              "readmeCreated": true,
              "readmeHasTitle": true,
              "gitignoreCreated": true,
              "gitignoreHasPycache": true,
              "noUnsafePaths": true
            }
          },
          {
            "id": "task_shell_command_lite",
            "source": "pinchbench/task_shell_command_generator",
            "points": 0,
            "maxPoints": 300,
            "score": 0,
            "status": "http_timeout_or_error",
            "details": {
              "responseStatus": "timeout_or_error",
              "rateLimitKind": "none",
              "providerName": null,
              "rateLimitLimit": null,
              "rateLimitRemaining": null,
              "rateLimitResetAt": null,
              "responsePreview": "The operation was aborted"
            }
          },
          {
            "id": "babylonian_clock_lite",
            "source": "shir-man/custom",
            "points": 0,
            "maxPoints": 100,
            "score": 0,
            "status": "failed",
            "details": {
              "expected": "02:12:48",
              "received": ""
            }
          }
        ],
        "cachedFromUpdatedAt": "2026-05-14T03:17:11.508Z",
        "cacheAgeDays": 4,
        "cacheMultiplier": 0.6
      },
      "reason": "Tools, reasoning, 128k+ context; lite eval 1/3",
      "instabilityPenalty": 0
    }
  ],
  "notes": [
    "Free model availability and rate limits can vary.",
    "Top candidates also received a lite agent eval for small file-writing, shell-command, and symbolic decoding tasks.",
    "The lite eval is a practical heuristic, not an official PinchBench result.",
    "Use openrouter/free if the recommended model is temporarily unavailable."
  ]
}