{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:XSJCDPQS372E5DUFEUGV5RKXKQ","merge_version":"pith-open-graph-merge-v1","event_count":7,"valid_event_count":7,"invalid_event_count":0,"equivocation_count":1,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"934474672251d10a921e9abdad8961e6b2e4069302316d6df9a0e979a4754a03","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:01:43Z","title_canon_sha256":"daf73d720c130d23fcec478f4224a2da1974d195d2e321265396253c90e5ec7d"},"schema_version":"1.0","source":{"id":"2605.13986","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.13986","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"arxiv_version","alias_value":"2605.13986v1","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.13986","created_at":"2026-05-17T23:39:13Z"},{"alias_kind":"pith_short_12","alias_value":"XSJCDPQS372E","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"XSJCDPQS372E5DUF","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"XSJCDPQS","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:d4f243df8dbab91b70dc17a0af32808f85327516a587151b9a0ef5be6363ea0d","target":"graph","created_at":"2026-05-17T23:39:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"On the standard tabular benchmark TabArena, a forward pass of TabPFN-3 outperforms all other models, including tuned and ensembled baselines, by a significant margin, and pareto-dominates the speed/performance frontier. TabPFN-3-Plus (Thinking) beats all non-TabPFN models by over 200 Elo on TabArena, rising to 420 Elo on the largest data subset, and outperforms AutoGluon 1.5 extreme while being 10x faster."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That benchmark wins on TabArena and other reported datasets, achieved via synthetic pretraining and test-time scaling, will generalize to arbitrary unseen real-world tabular distributions without hidden overfitting to the evaluation suites or synthetic data generator."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"TabPFN-3 delivers state-of-the-art tabular prediction performance on benchmarks up to 1M rows, is up to 20x faster than prior versions, and introduces test-time scaling that beats non-TabPFN models by hundreds of Elo points."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"TabPFN-3 outperforms all tuned and ensembled models on the TabArena tabular benchmark with a single forward pass."}],"snapshot_sha256":"9c2eb3fb0e63e7af2fed6b1e71e2d46fa1e1dd374ca90cf468c24ae1b34b8618"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"a704e78e85789a12bd7a5c9703756f095b1a5c40476d4b30cf6d9deb1483977e"},"paper":{"abstract_excerpt":"Tabular data underpins most high-value prediction problems in science and industry, and TabPFN has driven the foundation model revolution for this modality. Designed with feedback from our users, TabPFN-3 builds on this foundation to scale state-of-the-art performance to datasets with 1M training rows and substantially reduce training and inference time. Pretrained exclusively on synthetic data from our prior, TabPFN-3 dramatically pushes the frontier of tabular prediction and brings substantial gains on time series, relational, and tabular-text data. On the standard tabular benchmark TabArena","authors_text":"Adrian Hayler, Alan Arazi, Anurag Garg, Benjamin J\\\"ager, Bernhard Sch\\\"olkopf, Brendan Roof, Clara Cornu, David Salinas, Diana Kriuchkova, Dominik Safaric, Eliott Kalfon, Felix Birkel, Frank Hutter, Georg Grab, Jake Robertson, Jan Hendrik Metzen, Jerry Chen, Julien Siems, Klemens Fl\\\"oge, Kursat Kaya, Lennart Purucker, L\\'eo Grinsztajn, Lilly Charlotte Wehrhahn, Lydia Sidhoum, Madelon Hulsebos, Magnus B\\\"uhler, Marie Salmon, Mihir Manium, Nick Erickson, Noah Hollmann, Oscar Key, Philipp Jund, Philipp Singer, Samuel M\\\"uller, Sauraj Gambhir, Shi Bin (Liam) Hoo, Simon Bing, Simone Alessi, Siyuan Guo, Vladyslav Moroshan, Yann LeCun","cross_cats":["stat.ML"],"headline":"TabPFN-3 outperforms all tuned and ensembled models on the TabArena tabular benchmark with a single forward pass.","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:01:43Z","title":"TabPFN-3: Technical Report"},"references":{"count":298,"internal_anchors":10,"resolved_work":298,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"arXiv:2506.16791 [cs]","work_id":"155b5349-dee8-4870-965c-d54a700a19de","year":2025},{"cited_arxiv_id":"2003.06505","doi":"","is_internal_anchor":true,"ref_index":2,"title":"AutoGluon-Tabular: Robust and Accurate AutoML for Structured Data","work_id":"32ca4e6c-bd72-4586-8594-40eb6bcb6582","year":2003},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":3,"title":"A targeted real-time early warning score (trewscore) for septic shock.Science translational medicine, 7(299):299ra122–299ra122, 2015","work_id":"d0ee9103-1d6c-4559-a94d-4a9b0982590b","year":2015},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":4,"title":"Mimic-iii, a freely accessible critical care database.Scientific data, 3(1):1–9","work_id":"13d40ae1-31af-44be-b076-0f695baf06c1","year":2016},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"Deep neural networks detect suicide risk from textual facebook posts.Scientific reports, 10(1):16685, 2020","work_id":"c37e433c-b505-4c25-b86d-28a7053c35b7","year":2020}],"snapshot_sha256":"64be74b4799e08a11111a4ae45246b9dfc0fa4b9b032d5ed15177f39b6103526"},"source":{"id":"2605.13986","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-15T06:01:00.864685Z","id":"247b931c-a5c8-4309-87e2-c24bc67e4e35","model_set":{"reader":"grok-4.3"},"one_line_summary":"TabPFN-3 delivers state-of-the-art tabular prediction performance on benchmarks up to 1M rows, is up to 20x faster than prior versions, and introduces test-time scaling that beats non-TabPFN models by hundreds of Elo points.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"TabPFN-3 outperforms all tuned and ensembled models on the TabArena tabular benchmark with a single forward pass.","strongest_claim":"On the standard tabular benchmark TabArena, a forward pass of TabPFN-3 outperforms all other models, including tuned and ensembled baselines, by a significant margin, and pareto-dominates the speed/performance frontier. TabPFN-3-Plus (Thinking) beats all non-TabPFN models by over 200 Elo on TabArena, rising to 420 Elo on the largest data subset, and outperforms AutoGluon 1.5 extreme while being 10x faster.","weakest_assumption":"That benchmark wins on TabArena and other reported datasets, achieved via synthetic pretraining and test-time scaling, will generalize to arbitrary unseen real-world tabular distributions without hidden overfitting to the evaluation suites or synthetic data generator."}},"verdict_id":"247b931c-a5c8-4309-87e2-c24bc67e4e35"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:171ba927f6acec67d65988e7d09625ea10460c125e9c51276b76f71a649250bf","target":"record","created_at":"2026-05-17T23:39:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"934474672251d10a921e9abdad8961e6b2e4069302316d6df9a0e979a4754a03","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-13T18:01:43Z","title_canon_sha256":"daf73d720c130d23fcec478f4224a2da1974d195d2e321265396253c90e5ec7d"},"schema_version":"1.0","source":{"id":"2605.13986","kind":"arxiv","version":1}},"canonical_sha256":"bc9221be12dff44e8e85250d5ec5575405b13f3d27971128803d2e7670bb5e8a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"bc9221be12dff44e8e85250d5ec5575405b13f3d27971128803d2e7670bb5e8a","first_computed_at":"2026-05-17T23:39:13.319210Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:13.319210Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"1F//dGbgfqtVkZoTptkVvYg9C+z8IpQMECyakMLcOvyrrmZQ4rHMT/GQ3rviyGapvJnFp7lyS+gX75/q7zrhBw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:13.319843Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.13986","source_kind":"arxiv","source_version":1}}},"equivocations":[{"signer_id":"pith.science","event_type":"integrity_finding","target":"integrity","event_ids":["sha256:136c8e770f3ba7f8ed29f7cc681c3f997580fbda039684ee932d42a526b9128c","sha256:8b21500da1ae350374afb63b103c4b8542f8c1ee5dfec4a8316bfe1208b3ee58","sha256:b260493efddc3610e5664ce5078810f9bcb2127b8d9cfc1f26e4efd79cfa492c","sha256:b5681eb096d2a2bbe76fe33a6f63f28c7a32e6dedddbe79ec342425b6e277bc6","sha256:e8b78f36ddd1b8748d959a80fdfe74ab627750cbdf437b4c3e351e3703f82163"]}],"invalid_events":[],"applied_event_ids":["sha256:171ba927f6acec67d65988e7d09625ea10460c125e9c51276b76f71a649250bf","sha256:d4f243df8dbab91b70dc17a0af32808f85327516a587151b9a0ef5be6363ea0d"],"state_sha256":"3a8caa3fdb321628715c1e4be2c54aaf60de1d70637744cf46d0c1329489b316"}