verification_report.json
{
  "generated_by": "research/scripts/verify_paper_claims.py",
  "canonical_source": "/Users/rcerf/LocalDev/Sovereign_OS/research/data/paper_claims.json",
  "paper_source": "/Users/rcerf/LocalDev/Sovereign_OS/research/latex/externalization_boundary.tex",
  "summary": {
    "total_checks": 7,
    "pass": 6,
    "fail": 0,
    "warning": 1,
    "unverifiable": 0
  },
  "checks": [
    {
      "check_id": "AGG-01",
      "description": "Model count in title",
      "location": "line 14",
      "paper_value": "48",
      "canonical_value": "48",
      "status": "PASS",
      "note": ""
    },
    {
      "check_id": "AGG-02",
      "description": "Lab count in title",
      "location": "line 14",
      "paper_value": "22",
      "canonical_value": "22",
      "status": "PASS",
      "note": ""
    },
    {
      "check_id": "AGG-06-L27",
      "description": "Core study model/lab count (line 27)",
      "location": "line 27",
      "paper_value": "31 models, 11 labs",
      "canonical_value": "Core study (31 models, 11 labs)",
      "status": "PASS",
      "note": "Core study count, not format-sensitivity extension"
    },
    {
      "check_id": "AGG-06-L264",
      "description": "Core study model/lab count (line 264)",
      "location": "line 264",
      "paper_value": "31 models, 11 labs",
      "canonical_value": "Core study (31 models, 11 labs)",
      "status": "PASS",
      "note": "Core study count, not format-sensitivity extension"
    },
    {
      "check_id": "AGG-06-L373",
      "description": "Core study model/lab count (line 373)",
      "location": "line 373",
      "paper_value": "31 models, 11 labs",
      "canonical_value": "Core study (31 models, 11 labs)",
      "status": "PASS",
      "note": "Core study count, not format-sensitivity extension"
    },
    {
      "check_id": "D1-inline-gpt4o_mini-L137",
      "description": "GPT-4o-mini inline D1 (line 137)",
      "location": "line 137",
      "paper_value": "0.067",
      "canonical_value": "0.0222",
      "status": "WARNING",
      "note": "Delta=0.045"
    },
    {
      "check_id": "D1-inline-llama4_scout-L137",
      "description": "Llama 4 Scout inline D1 (line 137)",
      "location": "line 137",
      "paper_value": "0.600",
      "canonical_value": "0.6000",
      "status": "PASS",
      "note": ""
    }
  ]
}