{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:JR7N5D5K3HXQYSCUBMNG3CZINO","short_pith_number":"pith:JR7N5D5K","canonical_record":{"source":{"id":"2511.01938","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-11-02T18:44:42Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"2c5aa44a1072d3a580eb069994efa8f9d87de586c14d29289b081684fbb0021c","abstract_canon_sha256":"f52998b077ac93c46a17a74fffb6b62c861cc353363c4daa4e6810b30277cadf"},"schema_version":"1.0"},"canonical_sha256":"4c7ede8faad9ef0c48540b1a6d8b286ba55fad1783aa19cefa05154de111b3fe","source":{"kind":"arxiv","id":"2511.01938","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2511.01938","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"arxiv_version","alias_value":"2511.01938v3","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.01938","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"pith_short_12","alias_value":"JR7N5D5K3HXQ","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"pith_short_16","alias_value":"JR7N5D5K3HXQYSCU","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"pith_short_8","alias_value":"JR7N5D5K","created_at":"2026-06-02T01:03:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:JR7N5D5K3HXQYSCUBMNG3CZINO","target":"record","payload":{"canonical_record":{"source":{"id":"2511.01938","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-11-02T18:44:42Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"2c5aa44a1072d3a580eb069994efa8f9d87de586c14d29289b081684fbb0021c","abstract_canon_sha256":"f52998b077ac93c46a17a74fffb6b62c861cc353363c4daa4e6810b30277cadf"},"schema_version":"1.0"},"canonical_sha256":"4c7ede8faad9ef0c48540b1a6d8b286ba55fad1783aa19cefa05154de111b3fe","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T01:03:37.873712Z","signature_b64":"JVUMKE0C/DeVFrQM0RhctaMoxzNHUR6IwTWgapBHbZZw1Ko1ZLXvWy1n6q6SGtLxDd/Iwrw7BJWrh8zHIzcMBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4c7ede8faad9ef0c48540b1a6d8b286ba55fad1783aa19cefa05154de111b3fe","last_reissued_at":"2026-06-02T01:03:37.873161Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T01:03:37.873161Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2511.01938","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T01:03:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1N8JTK+VQdX10fwOXeGF339YCkYd8BfUi2VUfhUH4HOWzn7R0ed/renIZ63E8psxPVapDsT3BbxyIf4UTugZAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T08:08:00.697302Z"},"content_sha256":"11c3ba242768390f737fe0917cbe13dc84ce301fbf5d666233f65e658182ca9b","schema_version":"1.0","event_id":"sha256:11c3ba242768390f737fe0917cbe13dc84ce301fbf5d666233f65e658182ca9b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:JR7N5D5K3HXQYSCUBMNG3CZINO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"The Geometry of Grokking: Norm Minimization on the Zero-Loss Manifold","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Tiberiu Musat","submitted_at":"2025-11-02T18:44:42Z","abstract_excerpt":"Grokking is a puzzling phenomenon in neural networks where full generalization occurs only after a substantial delay following the complete memorization of the training data. Previous research has linked this delayed generalization to representation learning driven by weight decay, but the precise underlying dynamics remain elusive. In this paper, we argue that post-memorization learning can be understood through the lens of constrained optimization: gradient descent effectively minimizes the weight norm on the zero-loss manifold. We formally prove this in the limit of infinitesimally small le"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.01938","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2511.01938/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T01:03:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VQCg8w9BXFPznIcDtzUMadQthuaHC0k0bGx+jhA+FyTTzBulPsUAIYR/3uaPp1kMRmhlLwagvVGhhJAha9BTAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T08:08:00.698111Z"},"content_sha256":"8360bbcf95de3fe1b2458545a4dd40f4a49ea56302df4cca40c35e218d4d2c31","schema_version":"1.0","event_id":"sha256:8360bbcf95de3fe1b2458545a4dd40f4a49ea56302df4cca40c35e218d4d2c31"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JR7N5D5K3HXQYSCUBMNG3CZINO/bundle.json","state_url":"https://pith.science/pith/JR7N5D5K3HXQYSCUBMNG3CZINO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JR7N5D5K3HXQYSCUBMNG3CZINO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T08:08:00Z","links":{"resolver":"https://pith.science/pith/JR7N5D5K3HXQYSCUBMNG3CZINO","bundle":"https://pith.science/pith/JR7N5D5K3HXQYSCUBMNG3CZINO/bundle.json","state":"https://pith.science/pith/JR7N5D5K3HXQYSCUBMNG3CZINO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JR7N5D5K3HXQYSCUBMNG3CZINO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:JR7N5D5K3HXQYSCUBMNG3CZINO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f52998b077ac93c46a17a74fffb6b62c861cc353363c4daa4e6810b30277cadf","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-11-02T18:44:42Z","title_canon_sha256":"2c5aa44a1072d3a580eb069994efa8f9d87de586c14d29289b081684fbb0021c"},"schema_version":"1.0","source":{"id":"2511.01938","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2511.01938","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"arxiv_version","alias_value":"2511.01938v3","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.01938","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"pith_short_12","alias_value":"JR7N5D5K3HXQ","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"pith_short_16","alias_value":"JR7N5D5K3HXQYSCU","created_at":"2026-06-02T01:03:37Z"},{"alias_kind":"pith_short_8","alias_value":"JR7N5D5K","created_at":"2026-06-02T01:03:37Z"}],"graph_snapshots":[{"event_id":"sha256:8360bbcf95de3fe1b2458545a4dd40f4a49ea56302df4cca40c35e218d4d2c31","target":"graph","created_at":"2026-06-02T01:03:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2511.01938/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Grokking is a puzzling phenomenon in neural networks where full generalization occurs only after a substantial delay following the complete memorization of the training data. Previous research has linked this delayed generalization to representation learning driven by weight decay, but the precise underlying dynamics remain elusive. In this paper, we argue that post-memorization learning can be understood through the lens of constrained optimization: gradient descent effectively minimizes the weight norm on the zero-loss manifold. We formally prove this in the limit of infinitesimally small le","authors_text":"Tiberiu Musat","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-11-02T18:44:42Z","title":"The Geometry of Grokking: Norm Minimization on the Zero-Loss Manifold"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.01938","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:11c3ba242768390f737fe0917cbe13dc84ce301fbf5d666233f65e658182ca9b","target":"record","created_at":"2026-06-02T01:03:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f52998b077ac93c46a17a74fffb6b62c861cc353363c4daa4e6810b30277cadf","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-11-02T18:44:42Z","title_canon_sha256":"2c5aa44a1072d3a580eb069994efa8f9d87de586c14d29289b081684fbb0021c"},"schema_version":"1.0","source":{"id":"2511.01938","kind":"arxiv","version":3}},"canonical_sha256":"4c7ede8faad9ef0c48540b1a6d8b286ba55fad1783aa19cefa05154de111b3fe","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4c7ede8faad9ef0c48540b1a6d8b286ba55fad1783aa19cefa05154de111b3fe","first_computed_at":"2026-06-02T01:03:37.873161Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T01:03:37.873161Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"JVUMKE0C/DeVFrQM0RhctaMoxzNHUR6IwTWgapBHbZZw1Ko1ZLXvWy1n6q6SGtLxDd/Iwrw7BJWrh8zHIzcMBA==","signature_status":"signed_v1","signed_at":"2026-06-02T01:03:37.873712Z","signed_message":"canonical_sha256_bytes"},"source_id":"2511.01938","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:11c3ba242768390f737fe0917cbe13dc84ce301fbf5d666233f65e658182ca9b","sha256:8360bbcf95de3fe1b2458545a4dd40f4a49ea56302df4cca40c35e218d4d2c31"],"state_sha256":"16ea7c9df8fd2f6bb1121435a38cdfe2e7414f47fa0ded3cec8a130717dcc483"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CgtIUwTd++NdjZwx8BYeOipOxHI7MirQv14V++EAbgp7Hf+Mby7eRohoAtRXmhVvA2DWyykgAn5WXu1ymzVHBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T08:08:00.702212Z","bundle_sha256":"537350ff76f7197418617a9e69189f5fdb5db2b84ffd2be203c39f2a66756804"}}