{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:HTCHN7B66WYEROBASDW4WBSDHY","short_pith_number":"pith:HTCHN7B6","schema_version":"1.0","canonical_sha256":"3cc476fc3ef5b048b82090edcb06433e22e20b69034a78dbf6331d350414ae6c","source":{"kind":"arxiv","id":"2605.30229","version":1},"attestation_state":"computed","paper":{"title":"Anti Mode-Collapse in Mean-Field Transformer via Auxiliary Variables","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Kohei Hayashi, Masaaki Imaizumi, Masanori Koyama, Noboru Isobe","submitted_at":"2026-05-28T16:59:42Z","abstract_excerpt":"We use a mean-field-based transformer model to theoretically investigate how auxiliary variables, such as positional encoding, prevent mode collapse of self-attention mechanisms. The use of mean-field transformers to analyze the properties of self-attention mechanisms has garnered significant attention in recent years due to their ability to comprehensively analyze token interactions. However, analysis of this simple model suggests that mode collapse, where token distributions degenerate to a single point, occurs during long inferences (i.e., many layers), indicating a discrepancy with reality"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.30229","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-28T16:59:42Z","cross_cats_sorted":[],"title_canon_sha256":"e63988d93bcfdf3c118dfc03b714aae99ad0632418d3071f9ac2b79f705f5b1c","abstract_canon_sha256":"bd3c232a73ccf22bc2f9073d7068fc80954c8dbcea2e360035cc08bcba2c41a5"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T02:06:13.424937Z","signature_b64":"CTkm8hO0xIt51wEEsSDSU7KJn3CbwNQP+CXmTpLDzPChG00SrAzkDiUmUAkMVszYbEVbzfS365OGKeRY5E7HDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3cc476fc3ef5b048b82090edcb06433e22e20b69034a78dbf6331d350414ae6c","last_reissued_at":"2026-05-29T02:06:13.424579Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T02:06:13.424579Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Anti Mode-Collapse in Mean-Field Transformer via Auxiliary Variables","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Kohei Hayashi, Masaaki Imaizumi, Masanori Koyama, Noboru Isobe","submitted_at":"2026-05-28T16:59:42Z","abstract_excerpt":"We use a mean-field-based transformer model to theoretically investigate how auxiliary variables, such as positional encoding, prevent mode collapse of self-attention mechanisms. The use of mean-field transformers to analyze the properties of self-attention mechanisms has garnered significant attention in recent years due to their ability to comprehensively analyze token interactions. However, analysis of this simple model suggests that mode collapse, where token distributions degenerate to a single point, occurs during long inferences (i.e., many layers), indicating a discrepancy with reality"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.30229","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.30229/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.30229","created_at":"2026-05-29T02:06:13.424648+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.30229v1","created_at":"2026-05-29T02:06:13.424648+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.30229","created_at":"2026-05-29T02:06:13.424648+00:00"},{"alias_kind":"pith_short_12","alias_value":"HTCHN7B66WYE","created_at":"2026-05-29T02:06:13.424648+00:00"},{"alias_kind":"pith_short_16","alias_value":"HTCHN7B66WYEROBA","created_at":"2026-05-29T02:06:13.424648+00:00"},{"alias_kind":"pith_short_8","alias_value":"HTCHN7B6","created_at":"2026-05-29T02:06:13.424648+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY","json":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY.json","graph_json":"https://pith.science/api/pith-number/HTCHN7B66WYEROBASDW4WBSDHY/graph.json","events_json":"https://pith.science/api/pith-number/HTCHN7B66WYEROBASDW4WBSDHY/events.json","paper":"https://pith.science/paper/HTCHN7B6"},"agent_actions":{"view_html":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY","download_json":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY.json","view_paper":"https://pith.science/paper/HTCHN7B6","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.30229&json=true","fetch_graph":"https://pith.science/api/pith-number/HTCHN7B66WYEROBASDW4WBSDHY/graph.json","fetch_events":"https://pith.science/api/pith-number/HTCHN7B66WYEROBASDW4WBSDHY/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY/action/timestamp_anchor","attest_storage":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY/action/storage_attestation","attest_author":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY/action/author_attestation","sign_citation":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY/action/citation_signature","submit_replication":"https://pith.science/pith/HTCHN7B66WYEROBASDW4WBSDHY/action/replication_record"}},"created_at":"2026-05-29T02:06:13.424648+00:00","updated_at":"2026-05-29T02:06:13.424648+00:00"}