{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:U6G54NZX42QNZ6546JWRVL6T4D","short_pith_number":"pith:U6G54NZX","schema_version":"1.0","canonical_sha256":"a78dde3737e6a0dcfbbcf26d1aafd3e0e05b6d8c3ffa00194b6daa6cd89338b4","source":{"kind":"arxiv","id":"2605.26977","version":1},"attestation_state":"computed","paper":{"title":"Convergence of Spectral Descent for Non-smooth Optimization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["math.OC"],"primary_cat":"cs.LG","authors_text":"Song Li, Yixuan Yang, Yuqing He","submitted_at":"2026-05-26T13:02:49Z","abstract_excerpt":"The Muon optimizer has recently demonstrated remarkable empirical success in training large language models. However, the theoretical understanding of its mechanisms remains limited. Current convergence guarantees for Muon rely heavily on smoothness assumptions, leaving its non-smooth convergence behavior largely unexplored. In this work, we take a step toward bridging this gap by investigating Spectral Descent (SD), a simplified variant of Muon, together with its truncated counterpart, Truncated Spectral Descent (TSD). Under convexity, Lipschitz continuity, and sharpness conditions, we establ"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.26977","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-26T13:02:49Z","cross_cats_sorted":["math.OC"],"title_canon_sha256":"a20dcde0674053b3618365be86ae8288eb271e8d48d3b84c31077d00eeee20e1","abstract_canon_sha256":"28ef79a755b46219b1ef4645a12dad2885ea5a1207d954db6a7e86d492ea53ac"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-27T01:06:22.370485Z","signature_b64":"gZJdFfAyD6VH8Fl4W71rzNfPq0fbK3nIXEC6SaxSqnjPqgw9iauPgJ9oGREzf6yp0apX88Ljhhn8p407gBnwBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a78dde3737e6a0dcfbbcf26d1aafd3e0e05b6d8c3ffa00194b6daa6cd89338b4","last_reissued_at":"2026-05-27T01:06:22.369847Z","signature_status":"signed_v1","first_computed_at":"2026-05-27T01:06:22.369847Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Convergence of Spectral Descent for Non-smooth Optimization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["math.OC"],"primary_cat":"cs.LG","authors_text":"Song Li, Yixuan Yang, Yuqing He","submitted_at":"2026-05-26T13:02:49Z","abstract_excerpt":"The Muon optimizer has recently demonstrated remarkable empirical success in training large language models. However, the theoretical understanding of its mechanisms remains limited. Current convergence guarantees for Muon rely heavily on smoothness assumptions, leaving its non-smooth convergence behavior largely unexplored. In this work, we take a step toward bridging this gap by investigating Spectral Descent (SD), a simplified variant of Muon, together with its truncated counterpart, Truncated Spectral Descent (TSD). Under convexity, Lipschitz continuity, and sharpness conditions, we establ"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.26977","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.26977/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.26977","created_at":"2026-05-27T01:06:22.369964+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.26977v1","created_at":"2026-05-27T01:06:22.369964+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.26977","created_at":"2026-05-27T01:06:22.369964+00:00"},{"alias_kind":"pith_short_12","alias_value":"U6G54NZX42QN","created_at":"2026-05-27T01:06:22.369964+00:00"},{"alias_kind":"pith_short_16","alias_value":"U6G54NZX42QNZ654","created_at":"2026-05-27T01:06:22.369964+00:00"},{"alias_kind":"pith_short_8","alias_value":"U6G54NZX","created_at":"2026-05-27T01:06:22.369964+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D","json":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D.json","graph_json":"https://pith.science/api/pith-number/U6G54NZX42QNZ6546JWRVL6T4D/graph.json","events_json":"https://pith.science/api/pith-number/U6G54NZX42QNZ6546JWRVL6T4D/events.json","paper":"https://pith.science/paper/U6G54NZX"},"agent_actions":{"view_html":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D","download_json":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D.json","view_paper":"https://pith.science/paper/U6G54NZX","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.26977&json=true","fetch_graph":"https://pith.science/api/pith-number/U6G54NZX42QNZ6546JWRVL6T4D/graph.json","fetch_events":"https://pith.science/api/pith-number/U6G54NZX42QNZ6546JWRVL6T4D/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D/action/timestamp_anchor","attest_storage":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D/action/storage_attestation","attest_author":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D/action/author_attestation","sign_citation":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D/action/citation_signature","submit_replication":"https://pith.science/pith/U6G54NZX42QNZ6546JWRVL6T4D/action/replication_record"}},"created_at":"2026-05-27T01:06:22.369964+00:00","updated_at":"2026-05-27T01:06:22.369964+00:00"}