Corrigibility Failure Pathways
corrigibility-failure-pathwaysanalysisPath: /knowledge-base/models/corrigibility-failure-pathways/
E81Entity ID (EID)
Page Recorddatabase.json — merged from MDX frontmatter + Entity YAML + computed metrics at build time
{
"id": "corrigibility-failure-pathways",
"numericId": null,
"path": "/knowledge-base/models/corrigibility-failure-pathways/",
"filePath": "knowledge-base/models/corrigibility-failure-pathways.mdx",
"title": "Corrigibility Failure Pathways",
"quality": 62,
"readerImportance": 73,
"researchImportance": 80,
"tacticalValue": null,
"contentFormat": "article",
"tractability": null,
"neglectedness": null,
"uncertainty": null,
"causalLevel": null,
"lastUpdated": "2026-03-13",
"dateCreated": "2026-02-15",
"llmSummary": "This model systematically maps six pathways to corrigibility failure with quantified probability estimates (60-90% for advanced AI) and intervention effectiveness (40-70% reduction). It provides concrete risk matrices across capability levels, identifies pathway interactions that multiply severity 2-4x, and recommends specific interventions including bounded objectives (60-80% effective), self-modification restrictions (80-95%), and 4-10x increased research funding.",
"description": "This model maps pathways from AI training to corrigibility failure, with quantified probability estimates (60-90% for capable optimizers) and intervention effectiveness (40-70% reduction). It analyzes six failure mechanisms including instrumental convergence, goal preservation, and deceptive corrigibility with specific mitigation strategies.",
"ratings": {
"focus": 8.5,
"novelty": 4.5,
"rigor": 6,
"completeness": 7.5,
"concreteness": 7,
"actionability": 6.5
},
"category": "models",
"subcategory": "risk-models",
"clusters": [
"ai-safety"
],
"metrics": {
"wordCount": 1935,
"tableCount": 17,
"diagramCount": 1,
"internalLinks": 50,
"externalLinks": 0,
"footnoteCount": 0,
"bulletRatio": 0.27,
"sectionCount": 33,
"hasOverview": true,
"structuralScore": 12
},
"suggestedQuality": 80,
"updateFrequency": 90,
"evergreen": true,
"wordCount": 1935,
"unconvertedLinks": [],
"unconvertedLinkCount": 0,
"convertedLinkCount": 25,
"backlinkCount": 0,
"hallucinationRisk": {
"level": "medium",
"score": 60,
"factors": [
"no-citations",
"few-external-sources"
]
},
"entityType": "analysis",
"redundancy": {
"maxSimilarity": 20,
"similarPages": [
{
"id": "power-seeking-conditions",
"title": "Power-Seeking Emergence Conditions Model",
"path": "/knowledge-base/models/power-seeking-conditions/",
"similarity": 20
},
{
"id": "scheming-likelihood-model",
"title": "Scheming Likelihood Assessment",
"path": "/knowledge-base/models/scheming-likelihood-model/",
"similarity": 20
},
{
"id": "deceptive-alignment-decomposition",
"title": "Deceptive Alignment Decomposition Model",
"path": "/knowledge-base/models/deceptive-alignment-decomposition/",
"similarity": 18
},
{
"id": "instrumental-convergence-framework",
"title": "Instrumental Convergence Framework",
"path": "/knowledge-base/models/instrumental-convergence-framework/",
"similarity": 17
},
{
"id": "intervention-effectiveness-matrix",
"title": "Intervention Effectiveness Matrix",
"path": "/knowledge-base/models/intervention-effectiveness-matrix/",
"similarity": 17
}
]
},
"coverage": {
"passing": 8,
"total": 13,
"targets": {
"tables": 8,
"diagrams": 1,
"internalLinks": 15,
"externalLinks": 10,
"footnotes": 6,
"references": 6
},
"actuals": {
"tables": 17,
"diagrams": 1,
"internalLinks": 50,
"externalLinks": 0,
"footnotes": 0,
"references": 21,
"quotesWithQuotes": 0,
"quotesTotal": 0,
"accuracyChecked": 0,
"accuracyTotal": 0
},
"items": {
"llmSummary": "green",
"schedule": "green",
"entity": "green",
"editHistory": "red",
"overview": "green",
"tables": "green",
"diagrams": "green",
"internalLinks": "green",
"externalLinks": "red",
"footnotes": "red",
"references": "green",
"quotes": "red",
"accuracy": "red"
},
"ratingsString": "N:4.5 R:6 A:6.5 C:7.5"
},
"readerRank": 135,
"researchRank": 86,
"recommendedScore": 182.14
}External Links
No external links
Backlinks (0)
No backlinks