{
  "version": "v2",
  "generatedAt": "2026-05-19T17:58:04.814Z",
  "datasets": [
    {
      "id": "v2_Semi_Private",
      "displayName": "ARC-AGI-2",
      "url": ""
    }
  ],
  "evaluations": [
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "2025_human_panel",
      "modelDisplayName": "Human Panel",
      "modelType": null,
      "modelGroup": "Human",
      "modelReleaseDate": null,
      "providerId": "Human",
      "providerDisplayName": "Human",
      "providerColor": "#a9a9a9ff",
      "score": 1,
      "costPerTask": 17,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "NVARC_2025",
      "modelDisplayName": "NVARC",
      "modelType": "Custom",
      "modelGroup": "Kaggle",
      "modelReleaseDate": "2024-11-03T00:00:00.000Z",
      "providerId": "ARC Prize 2025",
      "providerDisplayName": "ARC Prize 2025",
      "providerColor": "#ff841cff",
      "score": 0.2764,
      "costPerTask": 0.2,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "ARChitects",
      "modelDisplayName": "ARChitects",
      "modelType": "Custom",
      "modelGroup": "Kaggle",
      "modelReleaseDate": "2024-11-03T00:00:00.000Z",
      "providerId": "ARC Prize 2024",
      "providerDisplayName": "ARC Prize 2024",
      "providerColor": "#ff841cff",
      "score": 0.025,
      "costPerTask": 0.2,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Claude 3.7",
      "modelDisplayName": "Claude 3.7",
      "modelType": "Base LLM",
      "modelGroup": null,
      "modelReleaseDate": "2025-02-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0,
      "costPerTask": 0.12,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Claude 3.7 Thinking 16K",
      "modelDisplayName": "Claude 3.7 (16K)",
      "modelType": "CoT",
      "modelGroup": "Claude_3_7_thinking",
      "modelReleaseDate": "2025-02-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.007,
      "costPerTask": 0.51,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Claude 3.7 Thinking 1K",
      "modelDisplayName": "Claude 3.7 (1K)",
      "modelType": "CoT",
      "modelGroup": "Claude_3_7_thinking",
      "modelReleaseDate": "2025-02-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.004,
      "costPerTask": 0.14,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Claude 3.7 Thinking 8K",
      "modelDisplayName": "Claude 3.7 (8K)",
      "modelType": "CoT",
      "modelGroup": "Claude_3_7_thinking",
      "modelReleaseDate": "2025-02-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.009,
      "costPerTask": 0.36,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Gemini 1.5 Pro",
      "modelDisplayName": "Gemini 1.5 Pro",
      "modelType": "Base LLM",
      "modelGroup": null,
      "modelReleaseDate": "2025-02-15T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.008,
      "costPerTask": 0.04,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Gemini 2.0 Flash",
      "modelDisplayName": "Gemini 2.0 Flash",
      "modelType": "Base LLM",
      "modelGroup": null,
      "modelReleaseDate": "2025-02-02T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.013,
      "costPerTask": 0.004,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-4-5-2025-02-27",
      "modelDisplayName": "GPT-4.5",
      "modelType": "Base LLM",
      "modelGroup": null,
      "modelReleaseDate": "2025-02-27T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.008,
      "costPerTask": 2.1,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-4o-2024-11-20",
      "modelDisplayName": "GPT-4o",
      "modelType": "Base LLM",
      "modelGroup": null,
      "modelReleaseDate": "2024-11-20T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.08,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-4o-mini-2024-07-18",
      "modelDisplayName": "GPT-4o-mini",
      "modelType": "Base LLM",
      "modelGroup": null,
      "modelReleaseDate": "2024-07-18T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.01,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Icecuber",
      "modelDisplayName": "Icecuber",
      "modelType": "Custom",
      "modelGroup": "Kaggle",
      "modelReleaseDate": "2023-11-03T00:00:00.000Z",
      "providerId": "ARC Prize 2024",
      "providerDisplayName": "ARC Prize 2024",
      "providerColor": "#ff841cff",
      "score": 0.016,
      "costPerTask": 0.13,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-preview-low",
      "modelDisplayName": "o3 (Preview, Low) ¹",
      "modelType": "CoT + Synthesis",
      "modelGroup": "o3-preview",
      "modelReleaseDate": "2024-12-20T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.04,
      "costPerTask": 200,
      "resultsUrl": "",
      "display": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "R1",
      "modelDisplayName": "Deepseek R1",
      "modelType": "CoT",
      "modelGroup": null,
      "modelReleaseDate": "2025-01-22T00:00:00.000Z",
      "providerId": "Deepseek",
      "providerDisplayName": "Deepseek",
      "providerColor": "#ffdc00ff",
      "score": 0.013,
      "costPerTask": 0.08,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Llama-4-Maverick-17B-128E-Instruct-FP8-together",
      "modelDisplayName": "Llama 4 Maverick",
      "modelType": "Base LLM",
      "modelGroup": "Llama 4",
      "modelReleaseDate": "2025-04-05T00:00:00.000Z",
      "providerId": "Meta",
      "providerDisplayName": "Meta",
      "providerColor": "#e43ba2ff",
      "score": 0,
      "costPerTask": 0.0121,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "Llama-4-Scout-17B-16E-Instruct-together",
      "modelDisplayName": "Llama 4 Scout",
      "modelType": "Base LLM",
      "modelGroup": "Llama 4",
      "modelReleaseDate": "2025-04-05T00:00:00.000Z",
      "providerId": "Meta",
      "providerDisplayName": "Meta",
      "providerColor": "#e43ba2ff",
      "score": 0,
      "costPerTask": 0.0062,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-4-1-nano-2025-04-14",
      "modelDisplayName": "GPT-4.1-Nano",
      "modelType": "Base LLM",
      "modelGroup": "gpt-4.1",
      "modelReleaseDate": "2025-04-14T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.0036,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-4-1-mini-2025-04-14",
      "modelDisplayName": "GPT-4.1-Mini",
      "modelType": "Base LLM",
      "modelGroup": "gpt-4.1",
      "modelReleaseDate": "2025-04-14T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.0139,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-4-1-2025-04-14",
      "modelDisplayName": "GPT-4.1",
      "modelType": "Base LLM",
      "modelGroup": "gpt-4.1",
      "modelReleaseDate": "2025-04-14T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0042,
      "costPerTask": 0.0691,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o1-mini-2024-09-12",
      "modelDisplayName": "o1-mini",
      "modelType": "CoT",
      "modelGroup": "o1-mini",
      "modelReleaseDate": "2024-09-12T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0083,
      "costPerTask": 0.1907,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-mini-2025-01-31-low",
      "modelDisplayName": "o3-mini (Low)",
      "modelType": "CoT",
      "modelGroup": "o3-mini",
      "modelReleaseDate": "2025-01-31T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.0623,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-mini-2025-01-31-medium",
      "modelDisplayName": "o3-mini (Medium)",
      "modelType": "CoT",
      "modelGroup": "o3-mini",
      "modelReleaseDate": "2025-01-31T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0208,
      "costPerTask": 0.2843,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-mini-2025-01-31-high",
      "modelDisplayName": "o3-mini (High)",
      "modelType": "CoT",
      "modelGroup": "o3-mini",
      "modelReleaseDate": "2025-01-31T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0299,
      "costPerTask": 0.5472,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-2025-04-16-low",
      "modelDisplayName": "o3 (Low)",
      "modelType": "CoT",
      "modelGroup": "o3",
      "modelReleaseDate": "2025-04-16T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0199,
      "costPerTask": 0.2343,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-2025-04-16-medium",
      "modelDisplayName": "o3 (Medium)",
      "modelType": "CoT",
      "modelGroup": "o3",
      "modelReleaseDate": "2025-04-16T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0298,
      "costPerTask": 0.4787,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-2025-04-16-high",
      "modelDisplayName": "o3 (High)",
      "modelType": "CoT",
      "modelGroup": "o3",
      "modelReleaseDate": "2025-04-16T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0653,
      "costPerTask": 0.8339,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o4-mini-2025-04-16-low",
      "modelDisplayName": "o4-mini (Low)",
      "modelType": "CoT",
      "modelGroup": "o4-mini",
      "modelReleaseDate": "2025-04-16T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0167,
      "costPerTask": 0.05,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o4-mini-2025-04-16-medium",
      "modelDisplayName": "o4-mini (Medium)",
      "modelType": "CoT",
      "modelGroup": "o4-mini",
      "modelReleaseDate": "2025-04-16T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0236,
      "costPerTask": 0.2311,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o4-mini-2025-04-16-high",
      "modelDisplayName": "o4-mini (High)",
      "modelType": "CoT",
      "modelGroup": "o4-mini",
      "modelReleaseDate": "2025-04-16T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0611,
      "costPerTask": 0.856,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-flash-preview-05-20",
      "modelDisplayName": "Gemini 2.5 Flash (Preview)",
      "modelType": "CoT",
      "modelGroup": null,
      "modelReleaseDate": "2025-05-20T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0169,
      "costPerTask": 0.057,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-flash-preview-05-20-thinking-1k",
      "modelDisplayName": "Gemini 2.5 Flash (Preview) (Thinking 1K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-flash-preview-05-20-thinking",
      "modelReleaseDate": "2025-05-20T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0216,
      "costPerTask": 0.0302,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-flash-preview-05-20-thinking-8k",
      "modelDisplayName": "Gemini 2.5 Flash (Preview) (Thinking 8K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-flash-preview-05-20-thinking",
      "modelReleaseDate": "2025-05-20T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0212,
      "costPerTask": 0.1994,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-flash-preview-05-20-thinking-16k",
      "modelDisplayName": "Gemini 2.5 Flash (Preview) (Thinking 16K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-flash-preview-05-20-thinking",
      "modelReleaseDate": "2025-05-20T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0198,
      "costPerTask": 0.3173,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-flash-preview-05-20-thinking-24k",
      "modelDisplayName": "Gemini 2.5 Flash (Preview) (Thinking 24K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-flash-preview-05-20-thinking",
      "modelReleaseDate": "2025-05-20T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0254,
      "costPerTask": 0.3191,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "codex-mini-latest",
      "modelDisplayName": "Codex Mini (Latest)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-05-23T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0127,
      "costPerTask": 0.23,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-20250514",
      "modelDisplayName": "Claude Sonnet 4",
      "modelType": "Base LLM",
      "modelGroup": "",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0127,
      "costPerTask": 0.1272,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-20250514-thinking-1k",
      "modelDisplayName": "Claude Sonnet 4 (Thinking 1K)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-20250514-thinking",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0085,
      "costPerTask": 0.1425,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-20250514-thinking-8k-bedrock",
      "modelDisplayName": "Claude Sonnet 4 (Thinking 8K)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-20250514-thinking",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0212,
      "costPerTask": 0.2654,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-20250514-thinking-16k-bedrock",
      "modelDisplayName": "Claude Sonnet 4 (Thinking 16K)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-20250514-thinking",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0593,
      "costPerTask": 0.4857,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-20250514-thinking-16k",
      "modelDisplayName": "Claude Opus 4 (Thinking 16K)",
      "modelType": "CoT",
      "modelGroup": "claude-opus-4-20250514-thinking",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0861,
      "costPerTask": 1.9284,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-20250514-thinking-8k",
      "modelDisplayName": "Claude Opus 4 (Thinking 8K)",
      "modelType": "CoT",
      "modelGroup": "claude-opus-4-20250514-thinking",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0452,
      "costPerTask": 1.1569,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-20250514-thinking-1k",
      "modelDisplayName": "Claude Opus 4 (Thinking 1K)",
      "modelType": "CoT",
      "modelGroup": "claude-opus-4-20250514-thinking",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0,
      "costPerTask": 0.7503,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-20250514",
      "modelDisplayName": "Claude Opus 4",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-05-14T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0127,
      "costPerTask": 0.6388,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "deepseek_r1_0528-openrouter",
      "modelDisplayName": "Deepseek R1 (05/28)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-05-28T00:00:00.000Z",
      "providerId": "Deepseek",
      "providerDisplayName": "Deepseek",
      "providerColor": "#ffdc00ff",
      "score": 0.0112,
      "costPerTask": 0.0527,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "grok-3-openrouter",
      "modelDisplayName": "Grok 3",
      "modelType": "Base LLM",
      "modelGroup": "",
      "modelReleaseDate": "2025-02-19T00:00:00.000Z",
      "providerId": "xAI",
      "providerDisplayName": "xAI",
      "providerColor": "#ff1ed9ff",
      "score": 0,
      "costPerTask": 0.1421,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "grok-3-mini-beta-low-openrouter",
      "modelDisplayName": "Grok 3 Mini (Low)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-02-19T00:00:00.000Z",
      "providerId": "xAI",
      "providerDisplayName": "xAI",
      "providerColor": "#ff1ed9ff",
      "score": 0.0042,
      "costPerTask": 0.0131,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-pro-preview-openrouter",
      "modelDisplayName": "Gemini 2.5 Pro (Preview)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-02-19T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0375,
      "costPerTask": 0.8126,
      "resultsUrl": "",
      "display": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-pro-preview-05-06-thinking-1k",
      "modelDisplayName": "Gemini 2.5 Pro (Preview, Thinking 1K)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-02-19T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0344,
      "costPerTask": 0.8037,
      "resultsUrl": "",
      "display": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-pro-2025-06-10-low",
      "modelDisplayName": "o3-Pro (Low)",
      "modelType": "CoT + Synthesis",
      "modelGroup": "o3-pro",
      "modelReleaseDate": "2025-06-10T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0205,
      "costPerTask": 2.2293,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-pro-2025-06-10-medium",
      "modelDisplayName": "o3-Pro (Medium)",
      "modelType": "CoT + Synthesis",
      "modelGroup": "o3-pro",
      "modelReleaseDate": "2025-06-10T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0194,
      "costPerTask": 4.7441,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "o3-pro-2025-06-10-high",
      "modelDisplayName": "o3-Pro (High)",
      "modelType": "CoT + Synthesis",
      "modelGroup": "o3-pro",
      "modelReleaseDate": "2025-06-10T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0486,
      "costPerTask": 7.5516,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "magistral-small-2506",
      "modelDisplayName": "Magistral Small",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-06-10T00:00:00.000Z",
      "providerId": "Mistral",
      "providerDisplayName": "Mistral",
      "providerColor": "#ffffffff",
      "score": 0,
      "costPerTask": 0.0488,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "magistral-medium-2506",
      "modelDisplayName": "Magistral Medium",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-06-10T00:00:00.000Z",
      "providerId": "Mistral",
      "providerDisplayName": "Mistral",
      "providerColor": "#ffffffff",
      "score": 0,
      "costPerTask": 0.1079,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "magistral-medium-2506-thinking",
      "modelDisplayName": "Magistral Medium (Thinking)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-06-10T00:00:00.000Z",
      "providerId": "Mistral",
      "providerDisplayName": "Mistral",
      "providerColor": "#ffffffff",
      "score": 0,
      "costPerTask": 0.123,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-pro-2025-06-17-thinking-1k",
      "modelDisplayName": "Gemini 2.5 Pro (Thinking 1K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-pro-2025-06-17-thinking",
      "modelReleaseDate": "2025-06-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0,
      "costPerTask": 0.0885,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-pro-2025-06-17-thinking-8k",
      "modelDisplayName": "Gemini 2.5 Pro (Thinking 8K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-pro-2025-06-17-thinking",
      "modelReleaseDate": "2025-06-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0292,
      "costPerTask": 0.4439,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-pro-2025-06-17-thinking-16k",
      "modelDisplayName": "Gemini 2.5 Pro (Thinking 16K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-pro-2025-06-17-thinking",
      "modelReleaseDate": "2025-06-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0403,
      "costPerTask": 0.7145,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-2-5-pro-2025-06-17-thinking-32k",
      "modelDisplayName": "Gemini 2.5 Pro (Thinking 32K)",
      "modelType": "CoT",
      "modelGroup": "gemini-2-5-pro-2025-06-17-thinking",
      "modelReleaseDate": "2025-06-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0486,
      "costPerTask": 0.757,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "grok-4-0709",
      "modelDisplayName": "Grok 4 (Thinking)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-07-09T00:00:00.000Z",
      "providerId": "xAI",
      "providerDisplayName": "xAI",
      "providerColor": "#ff1ed9ff",
      "score": 0.15975,
      "costPerTask": 2.1659,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "qwen3-235b-a22b-instruct-2507",
      "modelDisplayName": "Qwen3-235b-a22b Instruct (25/07)",
      "modelType": "Base LLM",
      "modelGroup": "",
      "modelReleaseDate": "2025-07-25T00:00:00.000Z",
      "providerId": "Alibaba",
      "providerDisplayName": "Alibaba",
      "providerColor": "#ffffffff",
      "score": 0.0125,
      "costPerTask": 0.0044,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2025-08-07-high",
      "modelDisplayName": "GPT-5 (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0986,
      "costPerTask": 0.7302,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2025-08-07-medium",
      "modelDisplayName": "GPT-5 (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0749,
      "costPerTask": 0.4486,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2025-08-07-low",
      "modelDisplayName": "GPT-5 (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0194,
      "costPerTask": 0.1896,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2025-08-07-low",
      "modelDisplayName": "GPT-5 (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0194,
      "costPerTask": 0.1896,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2025-08-07-minimal",
      "modelDisplayName": "GPT-5 (Minimal)",
      "modelType": "Base LLM",
      "modelGroup": "",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.0562,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-mini-2025-08-07-high",
      "modelDisplayName": "GPT-5 Mini (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-mini-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0444,
      "costPerTask": 0.1977,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-mini-2025-08-07-medium",
      "modelDisplayName": "GPT-5 Mini (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-mini-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0403,
      "costPerTask": 0.0629,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-mini-2025-08-07-low",
      "modelDisplayName": "GPT-5 Mini (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-mini-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0083,
      "costPerTask": 0.0189,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-mini-2025-08-07-minimal",
      "modelDisplayName": "GPT-5 Mini (Minimal)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0167,
      "costPerTask": 0.0094,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-nano-2025-08-07-high",
      "modelDisplayName": "GPT-5 Nano (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-nano-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0261,
      "costPerTask": 0.0295,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-nano-2025-08-07-medium",
      "modelDisplayName": "GPT-5 Nano (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-nano-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0088,
      "costPerTask": 0.0137,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-nano-2025-08-07-low",
      "modelDisplayName": "GPT-5 Nano (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-nano-reasoning",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.0033,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-nano-2025-08-07-minimal",
      "modelDisplayName": "GPT-5 Nano (Minimal)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0,
      "costPerTask": 0.0025,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "hrm-2-2508",
      "modelDisplayName": "Hierarchical Reasoning Model (HRM)",
      "modelType": "",
      "modelGroup": "",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "bespoke",
      "providerDisplayName": "Bespoke",
      "providerColor": "#ff841cff",
      "score": 0.02,
      "costPerTask": 1.68,
      "resultsUrl": "",
      "display": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "jeremy_sept_2025",
      "modelDisplayName": "Grok 4 (Refine.)",
      "modelType": "Refinement",
      "modelGroup": "",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "j_berman",
      "providerDisplayName": "J. Berman",
      "providerColor": "#ffffff",
      "score": 0.2944,
      "costPerTask": 30.4,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "eric_pang_sept_2025",
      "modelDisplayName": "Grok 4 (Refine.)",
      "modelType": "Refinement",
      "modelGroup": "",
      "modelReleaseDate": "2025-08-07T00:00:00.000Z",
      "providerId": "e_pang",
      "providerDisplayName": "E. Pang",
      "providerColor": "#ffffff",
      "score": 0.26,
      "costPerTask": 3.97,
      "resultsUrl": "",
      "display": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-5-20250929",
      "modelDisplayName": "Claude Sonnet 4.5",
      "modelType": "Base LLM",
      "modelGroup": "claude-sonnet-4-5-20250929",
      "modelReleaseDate": "2025-09-29T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0375,
      "costPerTask": 0.1295,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-5-20250929-thinking-1k",
      "modelDisplayName": "Claude Sonnet 4.5 (Thinking 1K)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-5-20250929",
      "modelReleaseDate": "2025-09-29T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0583,
      "costPerTask": 0.1424,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-5-20250929-thinking-8k",
      "modelDisplayName": "Claude Sonnet 4.5 (Thinking 8K)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-5-20250929",
      "modelReleaseDate": "2025-09-29T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0694,
      "costPerTask": 0.2349,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-5-20250929-thinking-16k",
      "modelDisplayName": "Claude Sonnet 4.5 (Thinking 16K)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-5-20250929",
      "modelReleaseDate": "2025-09-29T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0694,
      "costPerTask": 0.3499,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-sonnet-4-5-20250929-thinking-32k",
      "modelDisplayName": "Claude Sonnet 4.5 (Thinking 32K)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-5-20250929",
      "modelReleaseDate": "2025-09-29T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.1361,
      "costPerTask": 0.7589,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-pro-2025-10-06",
      "modelDisplayName": "GPT-5 Pro",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2025-10-06T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.1833,
      "costPerTask": 7.1432,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "trm-2025-10-07",
      "modelDisplayName": "Tiny Recursion Model (TRM)",
      "modelType": "",
      "modelGroup": "",
      "modelReleaseDate": "2025-10-07T00:00:00.000Z",
      "providerId": "bespoke",
      "providerDisplayName": "Bespoke",
      "providerColor": "#ff841cff",
      "score": 0.0625,
      "costPerTask": 2.1,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-haiku-4-5-20251001",
      "modelDisplayName": "Claude Haiku 4.5",
      "modelType": "Base LLM",
      "modelGroup": "claude-haiku-4-5-20251001",
      "modelReleaseDate": "2025-10-01T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0125,
      "costPerTask": 0.0426,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-haiku-4-5-20251001-thinking-1k",
      "modelDisplayName": "Claude Haiku 4.5 (Thinking 1K)",
      "modelType": "CoT",
      "modelGroup": "claude-haiku-4-5-20251001",
      "modelReleaseDate": "2025-10-01T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0125,
      "costPerTask": 0.0471,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-haiku-4-5-20251001-thinking-8k",
      "modelDisplayName": "Claude Haiku 4.5 (Thinking 8K)",
      "modelType": "CoT",
      "modelGroup": "claude-haiku-4-5-20251001",
      "modelReleaseDate": "2025-10-01T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0167,
      "costPerTask": 0.0909,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-haiku-4-5-20251001-thinking-16k",
      "modelDisplayName": "Claude Haiku 4.5 (Thinking 16K)",
      "modelType": "CoT",
      "modelGroup": "claude-haiku-4-5-20251001",
      "modelReleaseDate": "2025-10-01T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0278,
      "costPerTask": 0.1392,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-haiku-4-5-20251001-thinking-32k",
      "modelDisplayName": "Claude Haiku 4.5 (Thinking 32K)",
      "modelType": "CoT",
      "modelGroup": "claude-haiku-4-5-20251001",
      "modelReleaseDate": "2025-10-01T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0403,
      "costPerTask": 0.3766,
      "resultsUrl": "",
      "display": true,
      "displayLabel": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "grok-4-fast-reasoning",
      "modelDisplayName": "Grok 4 (Fast Reasoning)",
      "modelType": "CoT",
      "modelGroup": "grok-4-0709",
      "modelReleaseDate": "2025-10-21T00:00:00.000Z",
      "providerId": "xAI",
      "providerDisplayName": "xAI",
      "providerColor": "#ff1ed9",
      "score": 0.0528,
      "costPerTask": 0.061,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-1-2025-11-13-thinking-none",
      "modelDisplayName": "GPT-5.1 (Thinking, None)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-1-reasoning",
      "modelReleaseDate": "2025-11-13T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0042,
      "costPerTask": 0.0581,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-1-2025-11-13-thinking-low",
      "modelDisplayName": "GPT-5.1 (Thinking, Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-1-reasoning",
      "modelReleaseDate": "2025-11-13T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0194,
      "costPerTask": 0.129,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-1-2025-11-13-thinking-medium",
      "modelDisplayName": "GPT-5.1 (Thinking, Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-1-reasoning",
      "modelReleaseDate": "2025-11-13T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0653,
      "costPerTask": 0.4206,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-1-2025-11-13-thinking-high",
      "modelDisplayName": "GPT-5.1 (Thinking, High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-1-reasoning",
      "modelReleaseDate": "2025-11-13T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.1764,
      "costPerTask": 1.1704,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-pro-preview",
      "modelDisplayName": "Gemini 3 Pro",
      "modelType": "CoT",
      "modelGroup": "gemini-3-pro",
      "modelReleaseDate": "2025-11-18T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.3111,
      "costPerTask": 0.8109,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-deep-think-preview",
      "modelDisplayName": "Gemini 3 Deep Think (Preview) ²",
      "modelType": "CoT",
      "modelGroup": "gemini-3-deep-think-preview",
      "modelReleaseDate": "2026-02-12T16:13:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.4514,
      "costPerTask": 77.16309638,
      "resultsUrl": "",
      "display": true,
      "displayLabel": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-5-20251101-thinking-none",
      "modelDisplayName": "Opus 4.5 (Thinking, None)",
      "modelType": "CoT",
      "modelGroup": "opus-4-5-thinking",
      "modelReleaseDate": "2025-11-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0778,
      "costPerTask": 0.22,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-5-20251101-thinking-1k",
      "modelDisplayName": "Opus 4.5 (Thinking, 1K)",
      "modelType": "CoT",
      "modelGroup": "opus-4-5-thinking",
      "modelReleaseDate": "2025-11-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.0944,
      "costPerTask": 0.23,
      "resultsUrl": "",
      "display": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-5-20251101-thinking-8k",
      "modelDisplayName": "Opus 4.5 (Thinking, 8K)",
      "modelType": "CoT",
      "modelGroup": "opus-4-5-thinking",
      "modelReleaseDate": "2025-11-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.1389,
      "costPerTask": 0.48,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-5-20251101-thinking-16k",
      "modelDisplayName": "Opus 4.5 (Thinking, 16K)",
      "modelType": "CoT",
      "modelGroup": "opus-4-5-thinking",
      "modelReleaseDate": "2025-11-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.2278,
      "costPerTask": 0.79,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-5-20251101-thinking-32k",
      "modelDisplayName": "Opus 4.5 (Thinking, 32K)",
      "modelType": "CoT",
      "modelGroup": "opus-4-5-thinking",
      "modelReleaseDate": "2025-11-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.3056,
      "costPerTask": 1.29,
      "resultsUrl": "",
      "display": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-5-20251101-thinking-64k",
      "modelDisplayName": "Opus 4.5 (Thinking, 64K)",
      "modelType": "CoT",
      "modelGroup": "opus-4-5-thinking",
      "modelReleaseDate": "2025-11-24T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.3764,
      "costPerTask": 2.4,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "poetiq-arc-agi-gemini-3-d_v1",
      "modelDisplayName": "Gemini 3 Pro (Refine.)",
      "modelType": "Refinement",
      "modelGroup": "",
      "modelReleaseDate": "2025-12-04T00:00:00.000Z",
      "providerId": "poetiq",
      "providerDisplayName": "Poetiq",
      "providerColor": "#ffffff",
      "score": 0.54,
      "costPerTask": 30.568,
      "resultsUrl": "",
      "display": true,
      "displayLabel": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2-2025-12-11-thinking-none",
      "modelDisplayName": "GPT-5.2",
      "modelType": "Base LLM",
      "modelGroup": "",
      "modelReleaseDate": "2025-12-11T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0083,
      "costPerTask": 0.0818,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2-2025-12-11-thinking-low",
      "modelDisplayName": "GPT-5.2 (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-2-2025-12-11-thinking",
      "modelReleaseDate": "2025-12-11T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0972,
      "costPerTask": 0.2642,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2-2025-12-11-thinking-medium",
      "modelDisplayName": "GPT-5.2 (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-2-2025-12-11-thinking",
      "modelReleaseDate": "2025-12-11T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.2667,
      "costPerTask": 0.7594,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2-2025-12-11-thinking-high",
      "modelDisplayName": "GPT-5.2 (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-2-2025-12-11-thinking",
      "modelReleaseDate": "2025-12-11T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.4333,
      "costPerTask": 1.393,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2-2025-12-11-thinking-xhigh",
      "modelDisplayName": "GPT-5.2 (xHigh)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-2-2025-12-11-thinking",
      "modelReleaseDate": "2025-12-11T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.5291,
      "costPerTask": 1.8982,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2-pro-2025-12-11-medium",
      "modelDisplayName": "GPT-5.2 Pro (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-2-pro-2025-12-11-thinking",
      "modelReleaseDate": "2025-12-11T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.3847,
      "costPerTask": 8.9928,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-2-pro-2025-12-11-high",
      "modelDisplayName": "GPT-5.2 Pro (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-2-pro-2025-12-11-thinking",
      "modelReleaseDate": "2025-12-11T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.5416,
      "costPerTask": 15.721,
      "resultsUrl": "",
      "display": true,
      "labelOffsetX": -2,
      "labelOffsetY": -10
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-flash-preview-thinking-minimal",
      "modelDisplayName": "Gemini 3 Flash Preview (Minimal)",
      "modelType": "CoT",
      "modelGroup": "gemini-3-flash-preview-thinking",
      "modelReleaseDate": "2025-12-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0333,
      "costPerTask": 0.0205,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-flash-preview-thinking-low",
      "modelDisplayName": "Gemini 3 Flash Preview (Low)",
      "modelType": "CoT",
      "modelGroup": "gemini-3-flash-preview-thinking",
      "modelReleaseDate": "2025-12-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0125,
      "costPerTask": 0.0249,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-flash-preview-thinking-medium",
      "modelDisplayName": "Gemini 3 Flash Preview (Medium)",
      "modelType": "CoT",
      "modelGroup": "gemini-3-flash-preview-thinking",
      "modelReleaseDate": "2025-12-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.1278,
      "costPerTask": 0.0824,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-flash-preview-thinking-high",
      "modelDisplayName": "Gemini 3 Flash Preview (High)",
      "modelType": "CoT",
      "modelGroup": "gemini-3-flash-preview-thinking",
      "modelReleaseDate": "2025-12-17T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.3361,
      "costPerTask": 0.2314,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "grok-4.20-beta-0309b-reasoning",
      "modelDisplayName": "Grok 4.20 (Reasoning)",
      "modelType": "CoT",
      "modelGroup": "grok-4.20-beta-0309b-reasoning",
      "modelReleaseDate": "2026-03-09T00:00:00.000Z",
      "providerId": "xAI",
      "providerDisplayName": "xAI",
      "providerColor": "#ff1ed9",
      "score": 0.6514,
      "costPerTask": 0.92,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "johan_land_gpt_5_2_refine",
      "modelDisplayName": "GPT-5.2 (Refine.)",
      "modelType": "Refinement",
      "modelGroup": "",
      "modelReleaseDate": "2026-02-03T00:00:00.000Z",
      "providerId": "johan_land",
      "providerDisplayName": "Johan Land",
      "providerColor": "#ffffff",
      "score": 0.729,
      "costPerTask": 38.99,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-6-thinking-120K-low",
      "modelDisplayName": "Claude Opus 4.6 (120K, Low)",
      "modelType": "CoT",
      "modelGroup": "claude-opus-4-6-thinking",
      "modelReleaseDate": "2026-02-05T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.6458,
      "costPerTask": 2.2507,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-6-thinking-120K-medium",
      "modelDisplayName": "Claude Opus 4.6 (120K, Medium)",
      "modelType": "CoT",
      "modelGroup": "claude-opus-4-6-thinking",
      "modelReleaseDate": "2026-02-05T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.6625,
      "costPerTask": 2.7209,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-6-thinking-120K-high",
      "modelDisplayName": "Claude Opus 4.6 (120K, High)",
      "modelType": "CoT",
      "modelGroup": "claude-opus-4-6-thinking",
      "modelReleaseDate": "2026-02-05T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.6917,
      "costPerTask": 3.4719,
      "resultsUrl": "",
      "display": true,
      "displayLabel": false
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-opus-4-6-thinking-120K-max",
      "modelDisplayName": "Claude Opus 4.6 (120K, Max)",
      "modelType": "CoT",
      "modelGroup": "claude-opus-4-6-thinking",
      "modelReleaseDate": "2026-02-05T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.6875,
      "costPerTask": 3.641,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini_3_deep_think_022026",
      "modelDisplayName": "Gemini 3 Deep Think (2/26)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2026-02-12T16:13:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.8458,
      "costPerTask": 13.6213,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude_sonnet_4_6_max",
      "modelDisplayName": "Claude Sonnet 4.6 (Max)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-6",
      "modelReleaseDate": "2026-02-17T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.5833,
      "costPerTask": 2.7179,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude_sonnet_4_6_high",
      "modelDisplayName": "Claude Sonnet 4.6 (High)",
      "modelType": "CoT",
      "modelGroup": "claude-sonnet-4-6",
      "modelReleaseDate": "2026-02-17T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.6042,
      "costPerTask": 2.6966,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-1-pro-preview",
      "modelDisplayName": "Gemini 3.1 Pro (Preview)",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2026-02-19T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.7708,
      "costPerTask": 0.9622,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "kimi-k2.5",
      "modelDisplayName": "Kimi K2.5",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2026-01-27T00:00:00.000Z",
      "providerId": "Moonshot AI",
      "providerDisplayName": "Moonshot AI",
      "providerColor": "#00c8ff",
      "score": 0.1181,
      "costPerTask": 0.28,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "minimax-m2.5",
      "modelDisplayName": "Minimax M2.5",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2026-02-12T00:00:00.000Z",
      "providerId": "Minimax",
      "providerDisplayName": "Minimax",
      "providerColor": "#ffffff",
      "score": 0.0486,
      "costPerTask": 0.17,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "deepseek-v3.2",
      "modelDisplayName": "Deepseek V3.2",
      "modelType": "Base LLM",
      "modelGroup": "",
      "modelReleaseDate": "2025-12-01T00:00:00.000Z",
      "providerId": "Deepseek",
      "providerDisplayName": "Deepseek",
      "providerColor": "#ffdc00ff",
      "score": 0.0403,
      "costPerTask": 0.12,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "glm-5",
      "modelDisplayName": "GLM-5",
      "modelType": "CoT",
      "modelGroup": "",
      "modelReleaseDate": "2026-02-20T00:00:00.000Z",
      "providerId": "Z.ai",
      "providerDisplayName": "Z.ai",
      "providerColor": "#ffffff",
      "score": 0.0486,
      "costPerTask": 0.27,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-low",
      "modelDisplayName": "GPT-5.4 (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4",
      "modelReleaseDate": "2026-03-04T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.2917,
      "costPerTask": 0.27,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-medium",
      "modelDisplayName": "GPT-5.4 (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4",
      "modelReleaseDate": "2026-03-04T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.5542,
      "costPerTask": 0.68,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-high",
      "modelDisplayName": "GPT-5.4 (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4",
      "modelReleaseDate": "2026-03-04T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.675,
      "costPerTask": 1.02,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-xhigh",
      "modelDisplayName": "GPT-5.4 (xHigh)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4",
      "modelReleaseDate": "2026-03-04T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.7395,
      "costPerTask": 1.52,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-pro-xhigh",
      "modelDisplayName": "GPT-5.4 Pro (xHigh)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-pro",
      "modelReleaseDate": "2026-03-04T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.8333,
      "costPerTask": 16.41,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-mini-xhigh",
      "modelDisplayName": "GPT-5.4 Mini (xHigh)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-mini-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.189,
      "costPerTask": 0.75,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-mini-high",
      "modelDisplayName": "GPT-5.4 Mini (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-mini-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.1319,
      "costPerTask": 0.56,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-mini-medium",
      "modelDisplayName": "GPT-5.4 Mini (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-mini-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0444,
      "costPerTask": 0.33,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-mini-low",
      "modelDisplayName": "GPT-5.4 Mini (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-mini-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0111,
      "costPerTask": 0.06,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-nano-xhigh",
      "modelDisplayName": "GPT-5.4 Nano (xHigh)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-nano-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0569,
      "costPerTask": 0.16,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-nano-high",
      "modelDisplayName": "GPT-5.4 Nano (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-nano-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0361,
      "costPerTask": 0.13,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-nano-medium",
      "modelDisplayName": "GPT-5.4 Nano (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-nano-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0194,
      "costPerTask": 0.06,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-4-nano-low",
      "modelDisplayName": "GPT-5.4 Nano (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-4-nano-reasoning",
      "modelReleaseDate": "2026-03-17T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.0153,
      "costPerTask": 0.01,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-4-7-low",
      "modelDisplayName": "Claude 4.7 (Low)",
      "modelType": "CoT",
      "modelGroup": "claude-4-7",
      "modelReleaseDate": "2026-04-16T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.6208,
      "costPerTask": 2.38,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-4-7-medium",
      "modelDisplayName": "Claude 4.7 (Medium)",
      "modelType": "CoT",
      "modelGroup": "claude-4-7",
      "modelReleaseDate": "2026-04-16T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.675,
      "costPerTask": 2.96,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-4-7-high",
      "modelDisplayName": "Claude 4.7 (High)",
      "modelType": "CoT",
      "modelGroup": "claude-4-7",
      "modelReleaseDate": "2026-04-16T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.6833,
      "costPerTask": 3.17,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "claude-4-7-max",
      "modelDisplayName": "Claude 4.7 (Max)",
      "modelType": "CoT",
      "modelGroup": "claude-4-7",
      "modelReleaseDate": "2026-04-16T00:00:00.000Z",
      "providerId": "Anthropic",
      "providerDisplayName": "Anthropic",
      "providerColor": "#f93c32ff",
      "score": 0.7583,
      "costPerTask": 7.43,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-5-2026-04-22-thinking-low",
      "modelDisplayName": "GPT-5.5 (Low)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-5-2026-04-22-thinking",
      "modelReleaseDate": "2026-04-22T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.3333,
      "costPerTask": 0.35,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-5-2026-04-22-thinking-medium",
      "modelDisplayName": "GPT-5.5 (Medium)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-5-2026-04-22-thinking",
      "modelReleaseDate": "2026-04-22T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.7042,
      "costPerTask": 0.86,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-5-2026-04-22-thinking-high",
      "modelDisplayName": "GPT-5.5 (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-5-2026-04-22-thinking",
      "modelReleaseDate": "2026-04-22T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.8333,
      "costPerTask": 1.45,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-5-2026-04-22-thinking-xhigh",
      "modelDisplayName": "GPT-5.5 (xHigh)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-5-2026-04-22-thinking",
      "modelReleaseDate": "2026-04-22T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.85,
      "costPerTask": 1.87,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-5-pro-2026-04-23-high",
      "modelDisplayName": "GPT-5.5 Pro (High)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-5-pro-2026-04-23-thinking",
      "modelReleaseDate": "2026-04-23T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.8458,
      "costPerTask": 10.51,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gpt-5-5-pro-2026-04-23-xhigh",
      "modelDisplayName": "GPT-5.5 Pro (xHigh)",
      "modelType": "CoT",
      "modelGroup": "gpt-5-5-pro-2026-04-23-thinking",
      "modelReleaseDate": "2026-04-23T00:00:00.000Z",
      "providerId": "OpenAI",
      "providerDisplayName": "OpenAI",
      "providerColor": "#1e93ffff",
      "score": 0.8416,
      "costPerTask": 10.76,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-5-flash-minimal",
      "modelDisplayName": "Gemini 3.5 Flash (Minimal)",
      "modelType": "CoT",
      "modelGroup": "gemini-3-5-flash",
      "modelReleaseDate": "2026-05-19T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.0889,
      "costPerTask": 0.1074,
      "resultsUrl": "",
      "display": true
    },
    {
      "datasetId": "v2_Semi_Private",
      "datasetDisplayName": "ARC-AGI-2",
      "modelId": "gemini-3-5-flash-high",
      "modelDisplayName": "Gemini 3.5 Flash (High)",
      "modelType": "CoT",
      "modelGroup": "gemini-3-5-flash",
      "modelReleaseDate": "2026-05-19T00:00:00.000Z",
      "providerId": "Google",
      "providerDisplayName": "Google",
      "providerColor": "#4ecc30ff",
      "score": 0.7208,
      "costPerTask": 0.8503,
      "resultsUrl": "",
      "display": true
    }
  ]
}
