{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:PK5JOMRFAOBHPK5XN33DHDLAJW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"57b615f3453ed68939921552785edee228e347a89ddf50646e177f7f74c0c846","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-04-28T16:57:55Z","title_canon_sha256":"363aab4bae13ae5b327633d5b6d58a0c036a091a60c5d37ab622334b33173134"},"schema_version":"1.0","source":{"id":"2604.25858","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.25858","created_at":"2026-05-20T00:03:12Z"},{"alias_kind":"arxiv_version","alias_value":"2604.25858v2","created_at":"2026-05-20T00:03:12Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.25858","created_at":"2026-05-20T00:03:12Z"},{"alias_kind":"pith_short_12","alias_value":"PK5JOMRFAOBH","created_at":"2026-05-20T00:03:12Z"},{"alias_kind":"pith_short_16","alias_value":"PK5JOMRFAOBHPK5X","created_at":"2026-05-20T00:03:12Z"},{"alias_kind":"pith_short_8","alias_value":"PK5JOMRF","created_at":"2026-05-20T00:03:12Z"}],"graph_snapshots":[{"event_id":"sha256:2920e3404069f61c2e6a34c391b76ae86279f4af084a33cf9b15420ce0b350b8","target":"graph","created_at":"2026-05-20T00:03:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Through extensive sweeps across dimensionality, sequence length, task diversity, and signal-to-noise regimes, we identify the parameter regions in which benign overfitting arises and characterize how it depends on data geometry and training exposure."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"The linear in-context classifier formulation and controlled synthetic Gaussian-mixture setup isolate the geometric conditions under which models successfully infer task structure from context alone."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"Systematic sweeps show in-context test accuracy for Gaussian-mixture classification depends on input dimension, number of examples, and pre-training task count, with benign overfitting appearing in specific geometry and noise regimes."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"Transformers succeed at in-context binary classification on Gaussian mixtures under specific alignments of dimension, example count, and task diversity."}],"snapshot_sha256":"5aa74a7984f288dbd1f5a5cd14073e1f21bf11d20907f113df9cdea929ae16f9"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-19T20:43:09.338997Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2604.25858/integrity.json","findings":[],"snapshot_sha256":"acafd5c73cdedff691191455c1584ae6cea5d0f339f8d3c848563496f58bebc9","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Transformers have demonstrated a strong ability for in-context learning (ICL), enabling models to solve previously unseen tasks using only example input output pairs provided at inference time. While prior theoretical work has established conditions under which transformers can perform linear classification in-context, the empirical scaling behavior governing when this mechanism succeeds remains insufficiently characterized.\n  In this paper, we conduct a systematic empirical study of in-context learning for Gaussian-mixture binary classification tasks. Building on the theoretical framework of ","authors_text":"Arya Mazumdar, Leo Bangayan, Rushil Chandrupatla, Sebastian Leng","cross_cats":["cs.AI"],"headline":"Transformers succeed at in-context binary classification on Gaussian mixtures under specific alignments of dimension, example count, and task diversity.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-04-28T16:57:55Z","title":"Investigation into In-Context Learning Capabilities of Transformers"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2604.25858","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-07T16:25:42.888449Z","id":"77684d2a-c43d-408e-ad21-ce101aeaf7b3","model_set":{"reader":"grok-4.3"},"one_line_summary":"Systematic sweeps show in-context test accuracy for Gaussian-mixture classification depends on input dimension, number of examples, and pre-training task count, with benign overfitting appearing in specific geometry and noise regimes.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"Transformers succeed at in-context binary classification on Gaussian mixtures under specific alignments of dimension, example count, and task diversity.","strongest_claim":"Through extensive sweeps across dimensionality, sequence length, task diversity, and signal-to-noise regimes, we identify the parameter regions in which benign overfitting arises and characterize how it depends on data geometry and training exposure.","weakest_assumption":"The linear in-context classifier formulation and controlled synthetic Gaussian-mixture setup isolate the geometric conditions under which models successfully infer task structure from context alone."}},"verdict_id":"77684d2a-c43d-408e-ad21-ce101aeaf7b3"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:df702257c14485eb611b08facbc367bfecfb6f95c020934725093da439d44f86","target":"record","created_at":"2026-05-20T00:03:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"57b615f3453ed68939921552785edee228e347a89ddf50646e177f7f74c0c846","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-04-28T16:57:55Z","title_canon_sha256":"363aab4bae13ae5b327633d5b6d58a0c036a091a60c5d37ab622334b33173134"},"schema_version":"1.0","source":{"id":"2604.25858","kind":"arxiv","version":2}},"canonical_sha256":"7aba973225038277abb76ef6338d604db00dd237970f188ca7c44d00324e0c7e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7aba973225038277abb76ef6338d604db00dd237970f188ca7c44d00324e0c7e","first_computed_at":"2026-05-20T00:03:12.683711Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:03:12.683711Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+bJOCNad8O1mkANYo3slP8ynRHHsELe05eltOkj10/Ojciv/JJgN20PysAcewdXolSJ+Om53jRU978rZlwSSBw==","signature_status":"signed_v1","signed_at":"2026-05-20T00:03:12.684672Z","signed_message":"canonical_sha256_bytes"},"source_id":"2604.25858","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:df702257c14485eb611b08facbc367bfecfb6f95c020934725093da439d44f86","sha256:2920e3404069f61c2e6a34c391b76ae86279f4af084a33cf9b15420ce0b350b8"],"state_sha256":"7c8c365393c5ac4241c208fa51fec28eed98190294b6b8100291e91e2d917ecc"}