Longterm Wiki

AI Forecasting Benchmark Tournament

ai-forecasting-benchmark · project · Path: /knowledge-base/responses/ai-forecasting-benchmark/
E10 · Entity ID (EID)
← Back to page · 3 backlinks · Quality: 41 · Updated: 2026-03-13
Page Record: database.json — merged from MDX frontmatter + Entity YAML + computed metrics at build time
{
  "id": "ai-forecasting-benchmark",
  "numericId": null,
  "path": "/knowledge-base/responses/ai-forecasting-benchmark/",
  "filePath": "knowledge-base/responses/ai-forecasting-benchmark.mdx",
  "title": "AI Forecasting Benchmark Tournament",
  "quality": 41,
  "readerImportance": 22.5,
  "researchImportance": 37.5,
  "tacticalValue": null,
  "contentFormat": "article",
  "tractability": null,
  "neglectedness": null,
  "uncertainty": null,
  "causalLevel": null,
  "lastUpdated": "2026-03-13",
  "dateCreated": "2026-02-15",
  "llmSummary": "Quarterly competition (Q2 2025: 348 questions, 54 bot-makers, \\$30K prizes) comparing human Pro Forecasters against AI bots, with statistical testing showing humans maintain significant lead (p=0.00001) though AI improves ~24% Q3-Q4 2024. Best AI baseline is OpenAI's o3; top bot-makers are students/hobbyists; ensemble methods significantly improve performance.",
  "description": "A quarterly competition run by Metaculus comparing human Pro Forecasters against AI forecasting bots. Q2 2025 results (348 questions, 54 bot-makers) show Pro Forecasters maintain a statistically significant lead (p = 0.00001), though AI performance improves each quarter. Prize pool of \\$30,000 per quarter with API credits provided by OpenAI and Anthropic. Best AI baseline (Q2 2025): OpenAI's o3 model.",
  "ratings": {
    "novelty": 3.5,
    "rigor": 5,
    "actionability": 3,
    "completeness": 6.5
  },
  "category": "responses",
  "subcategory": "epistemic-platforms",
  "clusters": [
    "epistemics",
    "ai-safety"
  ],
  "metrics": {
    "wordCount": 1697,
    "tableCount": 20,
    "diagramCount": 1,
    "internalLinks": 8,
    "externalLinks": 7,
    "footnoteCount": 0,
    "bulletRatio": 0.08,
    "sectionCount": 33,
    "hasOverview": true,
    "structuralScore": 15
  },
  "suggestedQuality": 100,
  "updateFrequency": 45,
  "evergreen": true,
  "wordCount": 1697,
  "unconvertedLinks": [
    {
      "text": "Metaculus Homepage",
      "url": "https://www.metaculus.com/",
      "resourceId": "d99a6d0fb1edc2db",
      "resourceTitle": "Metaculus"
    }
  ],
  "unconvertedLinkCount": 1,
  "convertedLinkCount": 0,
  "backlinkCount": 3,
  "hallucinationRisk": {
    "level": "medium",
    "score": 55,
    "factors": [
      "no-citations"
    ]
  },
  "entityType": "project",
  "redundancy": {
    "maxSimilarity": 16,
    "similarPages": [
      {
        "id": "forecastbench",
        "title": "ForecastBench",
        "path": "/knowledge-base/responses/forecastbench/",
        "similarity": 16
      },
      {
        "id": "metaculus",
        "title": "Metaculus",
        "path": "/knowledge-base/organizations/metaculus/",
        "similarity": 14
      },
      {
        "id": "metaforecast",
        "title": "Metaforecast",
        "path": "/knowledge-base/responses/metaforecast/",
        "similarity": 12
      },
      {
        "id": "collective-intelligence",
        "title": "Collective Intelligence / Coordination",
        "path": "/knowledge-base/intelligence-paradigms/collective-intelligence/",
        "similarity": 11
      },
      {
        "id": "fri",
        "title": "Forecasting Research Institute",
        "path": "/knowledge-base/organizations/fri/",
        "similarity": 11
      }
    ]
  },
  "coverage": {
    "passing": 6,
    "total": 13,
    "targets": {
      "tables": 7,
      "diagrams": 1,
      "internalLinks": 14,
      "externalLinks": 8,
      "footnotes": 5,
      "references": 5
    },
    "actuals": {
      "tables": 20,
      "diagrams": 1,
      "internalLinks": 8,
      "externalLinks": 7,
      "footnotes": 0,
      "references": 1,
      "quotesWithQuotes": 0,
      "quotesTotal": 0,
      "accuracyChecked": 0,
      "accuracyTotal": 0
    },
    "items": {
      "llmSummary": "green",
      "schedule": "green",
      "entity": "green",
      "editHistory": "red",
      "overview": "green",
      "tables": "green",
      "diagrams": "green",
      "internalLinks": "amber",
      "externalLinks": "amber",
      "footnotes": "red",
      "references": "amber",
      "quotes": "red",
      "accuracy": "red"
    },
    "ratingsString": "N:3.5 R:5 A:3 C:6.5"
  },
  "readerRank": 505,
  "researchRank": 363,
  "recommendedScore": 114.84
}
External Links

No external links

Backlinks (3)
id | title | type | relationship
metaculus | Metaculus | organization |
epistemic-tools-tools-overview | Tools & Platforms (Overview) | concept |
forecastbench | ForecastBench | project |
Longterm Wiki