{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:4O5TM4K4IXJMBV74RFAFWCH5AX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"75e2049aab6447ac214794c2746933d0e03ec86166a67dbafeef5c9adf666fd5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-29T16:17:38Z","title_canon_sha256":"de25000a4993af7f233d808ccf9b875849b77ef6e8c8a505c308ed7b881ef985"},"schema_version":"1.0","source":{"id":"2606.30509","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.30509","created_at":"2026-06-30T02:18:18Z"},{"alias_kind":"arxiv_version","alias_value":"2606.30509v1","created_at":"2026-06-30T02:18:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.30509","created_at":"2026-06-30T02:18:18Z"},{"alias_kind":"pith_short_12","alias_value":"4O5TM4K4IXJM","created_at":"2026-06-30T02:18:18Z"},{"alias_kind":"pith_short_16","alias_value":"4O5TM4K4IXJMBV74","created_at":"2026-06-30T02:18:18Z"},{"alias_kind":"pith_short_8","alias_value":"4O5TM4K4","created_at":"2026-06-30T02:18:18Z"}],"graph_snapshots":[{"event_id":"sha256:95df877d39dc10e6039047e5440ba77b34dfe72c11692ab90868aca30459af42","target":"graph","created_at":"2026-06-30T02:18:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.30509/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Matrix factorization (i.e., problems of the form $\\min_{\\mathbf{P},\\mathbf{Q}} \\|\\mathbf{M}^\\star - \\mathbf{P}^\\top\\mathbf{Q}\\|_\\mathrm{F}^2$) is a minimal learning problem that exhibits both nonlinear parameter dynamics and representation learning. In this setting, we study how parameter trajectories under the Muon optimizer differ from those of gradient descent. We identify three main dynamical differences: 1) Muon avoids the slow saddle-to-saddle dynamics from small initialization. Muon instead learns all the top modes of $\\mathbf{M}^\\star$ at the same rate, with the smaller modes convergin","authors_text":"Dhruva Karkada, Jamie Simon, Mark Rhee","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-29T16:17:38Z","title":"Muon learns balanced solutions in matrix factorization without slow saddle-to-saddle dynamics"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.30509","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:532457e9a0cb71ed3afe354c5e7dabe7769311452593a3d1d5fe01b264460b31","target":"record","created_at":"2026-06-30T02:18:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"75e2049aab6447ac214794c2746933d0e03ec86166a67dbafeef5c9adf666fd5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-29T16:17:38Z","title_canon_sha256":"de25000a4993af7f233d808ccf9b875849b77ef6e8c8a505c308ed7b881ef985"},"schema_version":"1.0","source":{"id":"2606.30509","kind":"arxiv","version":1}},"canonical_sha256":"e3bb36715c45d2c0d7fc89405b08fd05e6f057887dcac5feba34127f26477b2e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e3bb36715c45d2c0d7fc89405b08fd05e6f057887dcac5feba34127f26477b2e","first_computed_at":"2026-06-30T02:18:18.151873Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-30T02:18:18.151873Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"O9ewIQShlin4o32ha7aZrQ5EFcXXEDU5gwk2eutzlxSOsqW9tbok+GxDFliAm9ksa5hB8drDGpcyq7QTytRKBQ==","signature_status":"signed_v1","signed_at":"2026-06-30T02:18:18.152371Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.30509","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:532457e9a0cb71ed3afe354c5e7dabe7769311452593a3d1d5fe01b264460b31","sha256:95df877d39dc10e6039047e5440ba77b34dfe72c11692ab90868aca30459af42"],"state_sha256":"cddba633d6ecd92f664d207af83d1c0297497c82da3c297ccf2ada555f6d8e3a"}