{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:Q6N54BJLAK7DXTLT5BCWDA556P","short_pith_number":"pith:Q6N54BJL","canonical_record":{"source":{"id":"2606.17945","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-16T13:53:48Z","cross_cats_sorted":[],"title_canon_sha256":"3e54df7dcd92fb247100b450b595fac7da8397af2bba9fd8b89ae3b2a465dd96","abstract_canon_sha256":"569af4a63c53da93a226abed901ebf526bbe11f8c2503c4d13532b7b31651ab5"},"schema_version":"1.0"},"canonical_sha256":"879bde052b02be3bcd73e8456183bdf3d286dc897c750d38f1c0d3ad42b8ef5d","source":{"kind":"arxiv","id":"2606.17945","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.17945","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"arxiv_version","alias_value":"2606.17945v1","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.17945","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"pith_short_12","alias_value":"Q6N54BJLAK7D","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"pith_short_16","alias_value":"Q6N54BJLAK7DXTLT","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"pith_short_8","alias_value":"Q6N54BJL","created_at":"2026-06-19T16:10:44Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:Q6N54BJLAK7DXTLT5BCWDA556P","target":"record","payload":{"canonical_record":{"source":{"id":"2606.17945","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-16T13:53:48Z","cross_cats_sorted":[],"title_canon_sha256":"3e54df7dcd92fb247100b450b595fac7da8397af2bba9fd8b89ae3b2a465dd96","abstract_canon_sha256":"569af4a63c53da93a226abed901ebf526bbe11f8c2503c4d13532b7b31651ab5"},"schema_version":"1.0"},"canonical_sha256":"879bde052b02be3bcd73e8456183bdf3d286dc897c750d38f1c0d3ad42b8ef5d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:10:44.186576Z","signature_b64":"zznasyfVuxXJE+mcdXXJV3oLIP34+9IFUFZTvutYrnPv6XxZ7iX3nfzJUtWqOxipwvgAE6Tmv7cgytG5RuokAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"879bde052b02be3bcd73e8456183bdf3d286dc897c750d38f1c0d3ad42b8ef5d","last_reissued_at":"2026-06-19T16:10:44.186216Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:10:44.186216Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.17945","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:10:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cYYgXLPI+PLDC7MQkXgYMA74MPalWgx3forGe5NedcsxsgS7iogXtqSSoQ7jN7i98NEbzGkYOp4ORKg02No7Bg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T19:30:09.398542Z"},"content_sha256":"0592a68d2343da7ba10e068fd7dad58dc16b8137c87f2888a7f13d73bb56c61c","schema_version":"1.0","event_id":"sha256:0592a68d2343da7ba10e068fd7dad58dc16b8137c87f2888a7f13d73bb56c61c"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:Q6N54BJLAK7DXTLT5BCWDA556P","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Small Initialization Matters for Large Language Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Feiyu Xiong, Hongkang Yang, Junjie Yao, Liangkai Hang, Zhi-Qin John Xu, Zhiyu Li","submitted_at":"2026-06-16T13:53:48Z","abstract_excerpt":"Large language models provide a tractable system for asking how intelligence itself emerges, rather than only how LLMs can be engineered. Although progress is usually attributed to scale, data and architecture, we show that parameter initialization is a gene-like determinant of training and, in particular, of model capacity. Reducing the initialization scale consistently improves pretraining, with the largest gains on reasoning-demanding tasks. We identify two widely used empirical settings that restrain the advantage of small initialization, and show how relaxing them restores favorable scali"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.17945","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.17945/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:10:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jOUgqBs+DpMNdW+Y/GKZCktPMeuG3OD7YZ6Mw+kmeatTM+kmTJnPQxjj0/EYy2qJcEEic5nla5TgQrraE/a5Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T19:30:09.398946Z"},"content_sha256":"e3c9556bbf4441b5239436818a348e1d3eb9c35742a7e0bd0d14c6a8aecc3850","schema_version":"1.0","event_id":"sha256:e3c9556bbf4441b5239436818a348e1d3eb9c35742a7e0bd0d14c6a8aecc3850"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/Q6N54BJLAK7DXTLT5BCWDA556P/bundle.json","state_url":"https://pith.science/pith/Q6N54BJLAK7DXTLT5BCWDA556P/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/Q6N54BJLAK7DXTLT5BCWDA556P/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T19:30:09Z","links":{"resolver":"https://pith.science/pith/Q6N54BJLAK7DXTLT5BCWDA556P","bundle":"https://pith.science/pith/Q6N54BJLAK7DXTLT5BCWDA556P/bundle.json","state":"https://pith.science/pith/Q6N54BJLAK7DXTLT5BCWDA556P/state.json","well_known_bundle":"https://pith.science/.well-known/pith/Q6N54BJLAK7DXTLT5BCWDA556P/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:Q6N54BJLAK7DXTLT5BCWDA556P","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"569af4a63c53da93a226abed901ebf526bbe11f8c2503c4d13532b7b31651ab5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-16T13:53:48Z","title_canon_sha256":"3e54df7dcd92fb247100b450b595fac7da8397af2bba9fd8b89ae3b2a465dd96"},"schema_version":"1.0","source":{"id":"2606.17945","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.17945","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"arxiv_version","alias_value":"2606.17945v1","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.17945","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"pith_short_12","alias_value":"Q6N54BJLAK7D","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"pith_short_16","alias_value":"Q6N54BJLAK7DXTLT","created_at":"2026-06-19T16:10:44Z"},{"alias_kind":"pith_short_8","alias_value":"Q6N54BJL","created_at":"2026-06-19T16:10:44Z"}],"graph_snapshots":[{"event_id":"sha256:e3c9556bbf4441b5239436818a348e1d3eb9c35742a7e0bd0d14c6a8aecc3850","target":"graph","created_at":"2026-06-19T16:10:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.17945/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large language models provide a tractable system for asking how intelligence itself emerges, rather than only how LLMs can be engineered. Although progress is usually attributed to scale, data and architecture, we show that parameter initialization is a gene-like determinant of training and, in particular, of model capacity. Reducing the initialization scale consistently improves pretraining, with the largest gains on reasoning-demanding tasks. We identify two widely used empirical settings that restrain the advantage of small initialization, and show how relaxing them restores favorable scali","authors_text":"Feiyu Xiong, Hongkang Yang, Junjie Yao, Liangkai Hang, Zhi-Qin John Xu, Zhiyu Li","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-16T13:53:48Z","title":"Small Initialization Matters for Large Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.17945","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0592a68d2343da7ba10e068fd7dad58dc16b8137c87f2888a7f13d73bb56c61c","target":"record","created_at":"2026-06-19T16:10:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"569af4a63c53da93a226abed901ebf526bbe11f8c2503c4d13532b7b31651ab5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-16T13:53:48Z","title_canon_sha256":"3e54df7dcd92fb247100b450b595fac7da8397af2bba9fd8b89ae3b2a465dd96"},"schema_version":"1.0","source":{"id":"2606.17945","kind":"arxiv","version":1}},"canonical_sha256":"879bde052b02be3bcd73e8456183bdf3d286dc897c750d38f1c0d3ad42b8ef5d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"879bde052b02be3bcd73e8456183bdf3d286dc897c750d38f1c0d3ad42b8ef5d","first_computed_at":"2026-06-19T16:10:44.186216Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:10:44.186216Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"zznasyfVuxXJE+mcdXXJV3oLIP34+9IFUFZTvutYrnPv6XxZ7iX3nfzJUtWqOxipwvgAE6Tmv7cgytG5RuokAQ==","signature_status":"signed_v1","signed_at":"2026-06-19T16:10:44.186576Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.17945","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0592a68d2343da7ba10e068fd7dad58dc16b8137c87f2888a7f13d73bb56c61c","sha256:e3c9556bbf4441b5239436818a348e1d3eb9c35742a7e0bd0d14c6a8aecc3850"],"state_sha256":"3195569229766c817d9ae9063e36d5a5886121594d3be0d53ca036f5a8163466"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"gIwp5IqFrSt3HCeku/mtJdNQGTkjEj10RgDXJRHWsCexoqa1CbLWz2xZirhglEYx8AduY9jl8h37sWDXZ1slAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T19:30:09.400994Z","bundle_sha256":"ee4f9624677eb331a2cfd9b9b4ef0200b121fcea8f6730b11d2cdef858f84ab4"}}