{"schema_version":"papers/paper-detail-v1","title":"Stop Probing, Start Coding: Why Linear Probes and Sparse Autoencoders Fail at Compositional Generalisation","surface":"papers","opportunity_kernel":{"paper_id":"4bf80b1e-90bf-41e2-9db0-11b6392cd7dd","title":"Stop Probing, Start Coding: Why Linear Probes and Sparse Autoencoders Fail at Compositional Generalisation","authors":["Vitória Barin Pacela","Shruti Joshi","Isabela Camacho","Simon Lacoste-Julien","David Klindt"],"arxiv_id":"2603.28744v1","doi":null,"published_at":"2026-03-30T17:52:16.000Z","score_object":{"overall":{"value":3,"scale":"0-10","confidence":0.85,"confidence_reason":"Backfilled from persisted papers.viability_score.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-02T02:30:40.136Z","fresh_until":"2026-05-02T02:30:40.136Z","is_stale":true,"source_count":1,"missingness":[]},"technical":{"value":2,"scale":"0-10","confidence":0.55,"confidence_reason":"Backfilled from paper_extraction_scorecards.reconstruction_score.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-03-31T20:22:55.575Z","fresh_until":"2026-04-14T20:22:55.575Z","is_stale":true,"source_count":1,"missingness":[]},"commercial":{"value":0,"scale":"0-10","confidence":0.75,"confidence_reason":"Backfilled from persisted commercial_flags and repo availability.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-02T02:30:40.136Z","fresh_until":"2026-05-02T02:30:40.136Z","is_stale":true,"source_count":1,"missingness":[]},"market":{"value":0,"scale":"0-10","confidence":0.15,"confidence_reason":"No persisted distribution_readiness_scores row was available; marked low confidence.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-02T02:30:40.136Z","fresh_until":"2026-04-16T02:30:40.136Z","is_stale":true,"source_count":0,"missingness":["distribution_readiness_scores.score"]},"team":{"value":10,"scale":"0-10","confidence":0.15,"confidence_reason":"No persisted team-quality evidence was available; marked low confidence.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-02T02:30:40.136Z","fresh_until":"2026-04-16T02:30:40.136Z","is_stale":true,"source_count":0,"missingness":["engineer_profiles.builder_score","author_startups"]},"methodology":{"value":9.4,"scale":"0-10","confidence":0.82,"confidence_reason":"Backfilled from paper_extraction_scorecards.total_score.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-03-31T20:22:55.575Z","fresh_until":"2026-04-30T20:22:55.575Z","is_stale":true,"source_count":2,"missingness":[]}},"evidence_receipt":{"freshness":"stale","proof_status":"unverified","repo_status":"missing","references_count":41,"source_count":3,"coverage":0.5,"missingness":["repo_url","proof_status","distribution_readiness_scores"],"unresolved_unknowns":["distribution readiness has not been computed yet","proof verification has not been recorded yet"],"last_verification_at":"2026-03-31T20:22:55.575Z"},"lineage_hash":"dd26436c0f92eff2d5e7b16c9f2a4e209a320a8eb3ac0e8be4f4e2d8211f16e7"},"distribution":null,"replication_evidence":[],"author_dna":[]}