{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:XMKKDZROK3OLAGJX5VFA7YKND6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e33d8d67eed9faf296c1a4dfde403d07356cb250b95866b1a89a79a87b6a3e39","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-02-16T08:13:23Z","title_canon_sha256":"da1d429176ea1a439e9ad17defaee5d76f3da5332069187e9fd5d104724c1e94"},"schema_version":"1.0","source":{"id":"2502.11034","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2502.11034","created_at":"2026-06-10T01:09:15Z"},{"alias_kind":"arxiv_version","alias_value":"2502.11034v3","created_at":"2026-06-10T01:09:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2502.11034","created_at":"2026-06-10T01:09:15Z"},{"alias_kind":"pith_short_12","alias_value":"XMKKDZROK3OL","created_at":"2026-06-10T01:09:15Z"},{"alias_kind":"pith_short_16","alias_value":"XMKKDZROK3OLAGJX","created_at":"2026-06-10T01:09:15Z"},{"alias_kind":"pith_short_8","alias_value":"XMKKDZRO","created_at":"2026-06-10T01:09:15Z"}],"graph_snapshots":[{"event_id":"sha256:0d4e254d7694063eb3f7e8bf006fa760ea8317949ab6ff9033998f4a804cbcf5","target":"graph","created_at":"2026-06-10T01:09:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2502.11034/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Loss spikes remain a persistent obstacle in large-scale language model pretraining. While previous research has attempted to identify the root cause of loss spikes by investigating individual factors, we observe that, in practice, such spikes are typically triggered by the confluence of heterogeneous factors. Empirically, loss spikes may arise from a combination of data outliers, hardware or transient computational faults, numerical precision issues, and hyperparameter settings. Regardless of the underlying cause, these spikes manifest as unstable optimizer updates, as abnormal gradients conta","authors_text":"Congliang Chen, Dianhai Yu, Guoxia Wang, JiaBin Yang, Jinle Zeng, Li Shen, Shuai Li, Yanjun Ma","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-02-16T08:13:23Z","title":"AdaGC: Enhancing LLM Pretraining Stability via Adaptive Gradient Clipping"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2502.11034","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4bd00124c93d31f0e11f61f8f75e96cccae830c96844138adc0e859aceee8246","target":"record","created_at":"2026-06-10T01:09:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e33d8d67eed9faf296c1a4dfde403d07356cb250b95866b1a89a79a87b6a3e39","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-02-16T08:13:23Z","title_canon_sha256":"da1d429176ea1a439e9ad17defaee5d76f3da5332069187e9fd5d104724c1e94"},"schema_version":"1.0","source":{"id":"2502.11034","kind":"arxiv","version":3}},"canonical_sha256":"bb14a1e62e56dcb01937ed4a0fe14d1fbaac407bbe1fa6016ea2d878c930620b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"bb14a1e62e56dcb01937ed4a0fe14d1fbaac407bbe1fa6016ea2d878c930620b","first_computed_at":"2026-06-10T01:09:15.417904Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-10T01:09:15.417904Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"IWyk/xzy1NTn2v+RQlRrprWxVOJvo2hWoaXdKrfxMWHrPf4/MUsL1Eed3UN/Z12JKmXSoTAo2HSeIUoM7zGODw==","signature_status":"signed_v1","signed_at":"2026-06-10T01:09:15.419088Z","signed_message":"canonical_sha256_bytes"},"source_id":"2502.11034","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4bd00124c93d31f0e11f61f8f75e96cccae830c96844138adc0e859aceee8246","sha256:0d4e254d7694063eb3f7e8bf006fa760ea8317949ab6ff9033998f4a804cbcf5"],"state_sha256":"527874a998ea53d361004f37af9b5a054b92d33dd8135a8c1da20e7623d525ba"}