{"schema_version":"papers/paper-detail-v1","title":"SUPERNOVA: Eliciting General Reasoning in LLMs with Reinforcement Learning on Natural Instructions","surface":"papers","opportunity_kernel":{"paper_id":"74aad2f4-d403-4514-a3b2-42f9a3a25abd","title":"SUPERNOVA: Eliciting General Reasoning in LLMs with Reinforcement Learning on Natural Instructions","authors":["Ashima Suvarna","Kendrick Phan","Mehrab Beikzadeh","Hritik Bansal","Saadia Gabriel"],"arxiv_id":"2604.08477v1","doi":null,"published_at":"2026-04-09T17:16:07.000Z","score_object":{"overall":{"value":7,"scale":"0-10","confidence":0.85,"confidence_reason":"Aligned to persisted papers.viability_score for public contract consistency.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-10T17:22:14.513Z","fresh_until":"2026-05-10T17:22:14.513Z","is_stale":true,"source_count":1,"missingness":[]},"technical":{"value":6.4,"scale":"0-10","confidence":0.7,"confidence_reason":"Backfilled from deployability_scores.score.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-10T20:18:25.155Z","fresh_until":"2026-04-24T20:18:25.155Z","is_stale":true,"source_count":2,"missingness":["reproducibility_results.reproducibility_score"]},"commercial":{"value":5,"scale":"0-10","confidence":0.75,"confidence_reason":"Backfilled from persisted commercial_flags and repo availability.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-10T17:22:14.513Z","fresh_until":"2026-05-10T17:22:14.513Z","is_stale":true,"source_count":2,"missingness":[]},"market":{"value":5.5,"scale":"0-10","confidence":0.8,"confidence_reason":"Backfilled from distribution_readiness_scores.score.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-10T17:36:49.516Z","fresh_until":"2026-04-24T17:36:49.516Z","is_stale":true,"source_count":1,"missingness":[]},"team":{"value":6.1,"scale":"0-10","confidence":0.42,"confidence_reason":"Heuristic fallback from paper author count and extracted affiliations.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-10T17:22:14.513Z","fresh_until":"2026-04-24T17:22:14.513Z","is_stale":true,"source_count":2,"missingness":[]},"methodology":{"value":4.7,"scale":"0-10","confidence":0.82,"confidence_reason":"Backfilled from paper_extraction_scorecards.total_score.","model_version":"phase0-backfill-v1","pipeline_version":"phase0-kernel-v1","computed_at":"2026-04-10T17:23:36.192Z","fresh_until":"2026-05-10T17:23:36.192Z","is_stale":true,"source_count":2,"missingness":[]}},"evidence_receipt":{"freshness":"stale","proof_status":"unverified","repo_status":"active","references_count":0,"source_count":4,"coverage":0.8333,"missingness":["references"],"unresolved_unknowns":[],"last_verification_at":"2026-04-10T20:18:25.155Z"},"lineage_hash":"10025607c715508955dab11d9fdf71f15eb4c7d404311e25ce50638f9ee52788"},"distribution":null,"replication_evidence":[],"author_dna":[{"author_id":"5731112f-df7c-4eb3-becd-37ff9878066d","name":"Ashima Suvarna","institution":"University of California, Los Angeles","h_index":null,"paper_count":1,"patents_count":0,"founder_score":11,"prior_startup":false,"industry_years":null,"top_skills":["Research"],"prior_commercialization_rate":null,"confidence":null,"paper_sample_size":0,"commercialized_paper_count":0,"last_backfilled_at":null,"archived_at":null},{"author_id":"c572b38c-096b-43e1-86f9-94abe4837549","name":"Kendrick Phan","institution":"University of California, Los Angeles","h_index":null,"paper_count":1,"patents_count":0,"founder_score":11,"prior_startup":false,"industry_years":null,"top_skills":["Research"],"prior_commercialization_rate":null,"confidence":null,"paper_sample_size":0,"commercialized_paper_count":0,"last_backfilled_at":null,"archived_at":null},{"author_id":"e60c384a-6c8f-4e92-863a-1b4459041fea","name":"Mehrab Beikzadeh","institution":"University of California, Los Angeles","h_index":null,"paper_count":1,"patents_count":0,"founder_score":11,"prior_startup":false,"industry_years":null,"top_skills":["Research"],"prior_commercialization_rate":null,"confidence":null,"paper_sample_size":0,"commercialized_paper_count":0,"last_backfilled_at":null,"archived_at":null},{"author_id":"b2e6054d-a65b-4a2a-b78a-75ed74d051aa","name":"Hritik Bansal","institution":"University of California, Los Angeles","h_index":null,"paper_count":1,"patents_count":0,"founder_score":11,"prior_startup":false,"industry_years":null,"top_skills":["Research"],"prior_commercialization_rate":null,"confidence":null,"paper_sample_size":0,"commercialized_paper_count":0,"last_backfilled_at":null,"archived_at":null},{"author_id":"d9d12e08-23da-42d9-97a7-4f4d91cd6473","name":"Saadia Gabriel","institution":"University of California, Los Angeles","h_index":null,"paper_count":1,"patents_count":0,"founder_score":11,"prior_startup":false,"industry_years":null,"top_skills":["Research"],"prior_commercialization_rate":null,"confidence":null,"paper_sample_size":0,"commercialized_paper_count":0,"last_backfilled_at":null,"archived_at":null}]}