{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2025:4EIUKAODF2KD4BRDN2XQ7TMUTT","short_pith_number":"pith:4EIUKAOD","schema_version":"1.0","canonical_sha256":"e1114501c32e943e06236eaf0fcd949cef50bef5b1c21844e5a6f25b8f1adb26","source":{"kind":"arxiv","id":"2511.02824","version":2},"attestation_state":"computed","paper":{"title":"Kosmos: An AI Scientist for Autonomous Discovery","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Aizad Kamal, Albert Bou, Ali E. Ghareeb, Andrew D. White, Angela Yiu, Arvis Sulovari, Asmamaw T. Wassie, Benjamin Chang, Bruna Gomes, Daniel L. Barabasi, Edwin Melville-Green, Eric C. Landsness, Euan A. Ashley, Fang Cao, Jon M. Laurent, Kaleigh F. Roberts, Karen E. Duff, Kevin J. Zwezdaryk, Laurie McCoy, Leah P. Shriver, Ludovico Mitchener, Martha Foiani, Mathieu Bourdenx, Mayk Caldas, Michaela M. Hinks, Michael Skarlinski, Miranda E. Orr, Nicky Evans, Randall J. Bateman, Samuel G. Rodriques, Shriya Reddy, Siddharth Narayanan, Sladjana Zagorac, Timothy C. Orr, Tom Rainforth, Tonio Buonassisi, Tyler Nadolski","submitted_at":"2025-11-04T18:50:52Z","abstract_excerpt":"Data-driven scientific discovery requires iterative cycles of literature search, hypothesis generation, and data analysis. Substantial progress has been made towards AI agents that can automate scientific research, but all such agents remain limited in the number of actions they can take before losing coherence, thus limiting the depth of their findings. Here we present Kosmos, an AI scientist that automates data-driven discovery. Given an open-ended objective and a dataset, Kosmos runs for up to 12 hours performing cycles of parallel data analysis, literature search, and hypothesis generation"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2511.02824","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2025-11-04T18:50:52Z","cross_cats_sorted":[],"title_canon_sha256":"ea973789ba4b700440f636d3569a3c578555bc6189b2e76724c8c669a7c72407","abstract_canon_sha256":"3e210cbebeedbfd1b10a5a31b9f15f92bcbe09c75d5b6c7a53e67bc74866ef6c"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-22T08:35:30.146013Z","signature_b64":"5ybA0l0oer9dezoMgd+TrJWtzOEbEOoJQ8HGWh3vsLEC4KKIR+WsLIIlhngsdcKuODf7N8zTb9DWvnxftNNjDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e1114501c32e943e06236eaf0fcd949cef50bef5b1c21844e5a6f25b8f1adb26","last_reissued_at":"2026-05-22T08:35:30.142803Z","signature_status":"signed_v1","first_computed_at":"2026-05-22T08:35:30.142803Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Kosmos: An AI Scientist for Autonomous Discovery","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Aizad Kamal, Albert Bou, Ali E. Ghareeb, Andrew D. White, Angela Yiu, Arvis Sulovari, Asmamaw T. Wassie, Benjamin Chang, Bruna Gomes, Daniel L. Barabasi, Edwin Melville-Green, Eric C. Landsness, Euan A. Ashley, Fang Cao, Jon M. Laurent, Kaleigh F. Roberts, Karen E. Duff, Kevin J. Zwezdaryk, Laurie McCoy, Leah P. Shriver, Ludovico Mitchener, Martha Foiani, Mathieu Bourdenx, Mayk Caldas, Michaela M. Hinks, Michael Skarlinski, Miranda E. Orr, Nicky Evans, Randall J. Bateman, Samuel G. Rodriques, Shriya Reddy, Siddharth Narayanan, Sladjana Zagorac, Timothy C. Orr, Tom Rainforth, Tonio Buonassisi, Tyler Nadolski","submitted_at":"2025-11-04T18:50:52Z","abstract_excerpt":"Data-driven scientific discovery requires iterative cycles of literature search, hypothesis generation, and data analysis. Substantial progress has been made towards AI agents that can automate scientific research, but all such agents remain limited in the number of actions they can take before losing coherence, thus limiting the depth of their findings. Here we present Kosmos, an AI scientist that automates data-driven discovery. Given an open-ended objective and a dataset, Kosmos runs for up to 12 hours performing cycles of parallel data analysis, literature search, and hypothesis generation"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.02824","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2511.02824/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2511.02824","created_at":"2026-05-22T08:35:30.142983+00:00"},{"alias_kind":"arxiv_version","alias_value":"2511.02824v2","created_at":"2026-05-22T08:35:30.142983+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.02824","created_at":"2026-05-22T08:35:30.142983+00:00"},{"alias_kind":"pith_short_12","alias_value":"4EIUKAODF2KD","created_at":"2026-05-22T08:35:30.142983+00:00"},{"alias_kind":"pith_short_16","alias_value":"4EIUKAODF2KD4BRD","created_at":"2026-05-22T08:35:30.142983+00:00"},{"alias_kind":"pith_short_8","alias_value":"4EIUKAOD","created_at":"2026-05-22T08:35:30.142983+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":26,"internal_anchor_count":26,"sample":[{"citing_arxiv_id":"2605.21825","citing_title":"Toward AI VIS Co-Scientists: A General and End-to-End Agent Harness for Solving Complex Data Visualization Tasks","ref_index":23,"is_internal_anchor":true},{"citing_arxiv_id":"2605.22681","citing_title":"Forecasting Scientific Progress with Artificial Intelligence","ref_index":42,"is_internal_anchor":true},{"citing_arxiv_id":"2605.22343","citing_title":"Sibyl-AutoResearch: Autonomous Research Needs Self-Evolving Trial-and-Error Harnesses, Not Paper Generators","ref_index":25,"is_internal_anchor":true},{"citing_arxiv_id":"2512.01089","citing_title":"CodeDistiller: Automatically Generating Code Libraries for Scientific Coding Agents","ref_index":16,"is_internal_anchor":true},{"citing_arxiv_id":"2605.16294","citing_title":"Are Researchers Being Replaced by Artificial Intelligence?","ref_index":2,"is_internal_anchor":true},{"citing_arxiv_id":"2605.07022","citing_title":"Self-Driving Datasets: From 20 Million Papers to Nuanced Biomedical Knowledge at Scale","ref_index":47,"is_internal_anchor":true},{"citing_arxiv_id":"2605.18831","citing_title":"Towards Discovery of Polymers for Insulin Delivery via Physics-Grounded Agentic Workflows","ref_index":23,"is_internal_anchor":true},{"citing_arxiv_id":"2605.18831","citing_title":"Towards Discovery of Polymers for Insulin Delivery via Physics-Grounded Agentic Workflows","ref_index":24,"is_internal_anchor":true},{"citing_arxiv_id":"2605.18661","citing_title":"AI for Auto-Research: Roadmap & User Guide","ref_index":133,"is_internal_anchor":true},{"citing_arxiv_id":"2512.15930","citing_title":"Scalable Agentic Reasoning for Designing Biologics Targeting Intrinsically Disordered Proteins","ref_index":45,"is_internal_anchor":true},{"citing_arxiv_id":"2512.15567","citing_title":"Evaluating Large Language Models in Scientific Discovery","ref_index":33,"is_internal_anchor":true},{"citing_arxiv_id":"2602.04850","citing_title":"El Agente Quntur: A research collaborator agent for quantum chemistry","ref_index":37,"is_internal_anchor":true},{"citing_arxiv_id":"2603.03295","citing_title":"Language Model Goal Selection Differs from Humans' in a Self-Directed Learning Task","ref_index":12,"is_internal_anchor":true},{"citing_arxiv_id":"2604.09590","citing_title":"DeepReviewer 2.0: A Traceable Agentic System for Auditable Scientific Peer Review","ref_index":3,"is_internal_anchor":true},{"citing_arxiv_id":"2603.09970","citing_title":"CREATE: Testing LLMs for Associative Creativity","ref_index":3,"is_internal_anchor":true},{"citing_arxiv_id":"2605.06651","citing_title":"AI co-mathematician: Accelerating mathematicians with agentic AI","ref_index":46,"is_internal_anchor":true},{"citing_arxiv_id":"2605.11258","citing_title":"Unlocking LLM Creativity in Science through Analogical Reasoning","ref_index":29,"is_internal_anchor":true},{"citing_arxiv_id":"2605.05921","citing_title":"Intentmaking and Sensemaking: Human Interaction with AI-Guided Mathematical Discovery","ref_index":26,"is_internal_anchor":true},{"citing_arxiv_id":"2605.01489","citing_title":"SciResearcher: Scaling Deep Research Agents for Frontier Scientific Reasoning","ref_index":26,"is_internal_anchor":true},{"citing_arxiv_id":"2604.18805","citing_title":"AI scientists produce results without reasoning scientifically","ref_index":20,"is_internal_anchor":true},{"citing_arxiv_id":"2605.07022","citing_title":"Self-Driving Datasets: From 20 Million Papers to Nuanced Biomedical Knowledge at Scale","ref_index":48,"is_internal_anchor":true},{"citing_arxiv_id":"2604.25610","citing_title":"Optimizing ground state preparation protocols with autoresearch","ref_index":26,"is_internal_anchor":true},{"citing_arxiv_id":"2605.07022","citing_title":"Self-Driving Datasets: From 20 Million Papers to Nuanced Biomedical Knowledge at Scale","ref_index":47,"is_internal_anchor":true},{"citing_arxiv_id":"2604.15411","citing_title":"PRL-Bench: A Comprehensive Benchmark Evaluating LLMs' Capabilities in Frontier Physics Research","ref_index":5,"is_internal_anchor":true},{"citing_arxiv_id":"2604.25610","citing_title":"Optimizing ground state preparation protocols with autoresearch","ref_index":26,"is_internal_anchor":true}]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT","json":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT.json","graph_json":"https://pith.science/api/pith-number/4EIUKAODF2KD4BRDN2XQ7TMUTT/graph.json","events_json":"https://pith.science/api/pith-number/4EIUKAODF2KD4BRDN2XQ7TMUTT/events.json","paper":"https://pith.science/paper/4EIUKAOD"},"agent_actions":{"view_html":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT","download_json":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT.json","view_paper":"https://pith.science/paper/4EIUKAOD","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2511.02824&json=true","fetch_graph":"https://pith.science/api/pith-number/4EIUKAODF2KD4BRDN2XQ7TMUTT/graph.json","fetch_events":"https://pith.science/api/pith-number/4EIUKAODF2KD4BRDN2XQ7TMUTT/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT/action/timestamp_anchor","attest_storage":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT/action/storage_attestation","attest_author":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT/action/author_attestation","sign_citation":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT/action/citation_signature","submit_replication":"https://pith.science/pith/4EIUKAODF2KD4BRDN2XQ7TMUTT/action/replication_record"}},"created_at":"2026-05-22T08:35:30.142983+00:00","updated_at":"2026-05-22T08:35:30.142983+00:00"}