{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:M5BNRHPUWGA7MHPFDKCQKNVN6T","short_pith_number":"pith:M5BNRHPU","canonical_record":{"source":{"id":"1711.04623","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-13T15:11:56Z","cross_cats_sorted":["cs.AI","cs.CV","stat.ML"],"title_canon_sha256":"8374a5494e65f1b9671443e920c94106ccb3751de54b7b0fb22be87c2beb9e16","abstract_canon_sha256":"422ac8d1f82e758fbdde6344531805f5be3c1f9e9c312b760582b691292c8113"},"schema_version":"1.0"},"canonical_sha256":"6742d89df4b181f61de51a850536adf4fdf7a8a9c65a8fd6111076b17f2d4ebe","source":{"kind":"arxiv","id":"1711.04623","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.04623","created_at":"2026-05-18T00:05:51Z"},{"alias_kind":"arxiv_version","alias_value":"1711.04623v3","created_at":"2026-05-18T00:05:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.04623","created_at":"2026-05-18T00:05:51Z"},{"alias_kind":"pith_short_12","alias_value":"M5BNRHPUWGA7","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"M5BNRHPUWGA7MHPF","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"M5BNRHPU","created_at":"2026-05-18T12:31:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:M5BNRHPUWGA7MHPFDKCQKNVN6T","target":"record","payload":{"canonical_record":{"source":{"id":"1711.04623","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-13T15:11:56Z","cross_cats_sorted":["cs.AI","cs.CV","stat.ML"],"title_canon_sha256":"8374a5494e65f1b9671443e920c94106ccb3751de54b7b0fb22be87c2beb9e16","abstract_canon_sha256":"422ac8d1f82e758fbdde6344531805f5be3c1f9e9c312b760582b691292c8113"},"schema_version":"1.0"},"canonical_sha256":"6742d89df4b181f61de51a850536adf4fdf7a8a9c65a8fd6111076b17f2d4ebe","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:05:51.088728Z","signature_b64":"fP2OFxXEOBNgEQkyndIyq5a2KnNbadwB2qVlPEgvS5FTfw5x1r0BN1eB14cgl9ftHSWVnSqJCO8WdvyPxa4TDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6742d89df4b181f61de51a850536adf4fdf7a8a9c65a8fd6111076b17f2d4ebe","last_reissued_at":"2026-05-18T00:05:51.088069Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:05:51.088069Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1711.04623","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"chVBWuwdjOJ1ruOyFOcUUIDKEUFhzEXIH3XEk1SRsl6TYcbrQ58cTa3s2O6rdEXhmsC8ZvkH+69l7xCzPGvfCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T19:48:22.391217Z"},"content_sha256":"0cf2ca14dfbb6a8a567c89dbea99562ef2120338e18661863f3f37fa8abb78fe","schema_version":"1.0","event_id":"sha256:0cf2ca14dfbb6a8a567c89dbea99562ef2120338e18661863f3f37fa8abb78fe"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:M5BNRHPUWGA7MHPFDKCQKNVN6T","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Three Factors Influencing Minima in SGD","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CV","stat.ML"],"primary_cat":"cs.LG","authors_text":"Amos Storkey, Asja Fischer, Devansh Arpit, Nicolas Ballas, Stanis{\\l}aw Jastrz\\k{e}bski, Yoshua Bengio, Zachary Kenton","submitted_at":"2017-11-13T15:11:56Z","abstract_excerpt":"We investigate the dynamical and convergent properties of stochastic gradient descent (SGD) applied to Deep Neural Networks (DNNs). Characterizing the relation between learning rate, batch size and the properties of the final minima, such as width or generalization, remains an open question. In order to tackle this problem we investigate the previously proposed approximation of SGD by a stochastic differential equation (SDE). We theoretically argue that three factors - learning rate, batch size and gradient covariance - influence the minima found by SGD. In particular we find that the ratio of"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.04623","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oGZpOZlHpzDebbIE0Dp9liG/l4q2JZIBxCSMCSm3ycPKIamscVGrRFmRM4HNecA/VskJJUEClbpRvl9tsKiaAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T19:48:22.392012Z"},"content_sha256":"67eb3f4c0fa3f7ba298c13b7516c477f486b5d5152ce6939d702d7503bfa57cf","schema_version":"1.0","event_id":"sha256:67eb3f4c0fa3f7ba298c13b7516c477f486b5d5152ce6939d702d7503bfa57cf"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/M5BNRHPUWGA7MHPFDKCQKNVN6T/bundle.json","state_url":"https://pith.science/pith/M5BNRHPUWGA7MHPFDKCQKNVN6T/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/M5BNRHPUWGA7MHPFDKCQKNVN6T/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T19:48:22Z","links":{"resolver":"https://pith.science/pith/M5BNRHPUWGA7MHPFDKCQKNVN6T","bundle":"https://pith.science/pith/M5BNRHPUWGA7MHPFDKCQKNVN6T/bundle.json","state":"https://pith.science/pith/M5BNRHPUWGA7MHPFDKCQKNVN6T/state.json","well_known_bundle":"https://pith.science/.well-known/pith/M5BNRHPUWGA7MHPFDKCQKNVN6T/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:M5BNRHPUWGA7MHPFDKCQKNVN6T","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"422ac8d1f82e758fbdde6344531805f5be3c1f9e9c312b760582b691292c8113","cross_cats_sorted":["cs.AI","cs.CV","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-13T15:11:56Z","title_canon_sha256":"8374a5494e65f1b9671443e920c94106ccb3751de54b7b0fb22be87c2beb9e16"},"schema_version":"1.0","source":{"id":"1711.04623","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.04623","created_at":"2026-05-18T00:05:51Z"},{"alias_kind":"arxiv_version","alias_value":"1711.04623v3","created_at":"2026-05-18T00:05:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.04623","created_at":"2026-05-18T00:05:51Z"},{"alias_kind":"pith_short_12","alias_value":"M5BNRHPUWGA7","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"M5BNRHPUWGA7MHPF","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"M5BNRHPU","created_at":"2026-05-18T12:31:28Z"}],"graph_snapshots":[{"event_id":"sha256:67eb3f4c0fa3f7ba298c13b7516c477f486b5d5152ce6939d702d7503bfa57cf","target":"graph","created_at":"2026-05-18T00:05:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We investigate the dynamical and convergent properties of stochastic gradient descent (SGD) applied to Deep Neural Networks (DNNs). Characterizing the relation between learning rate, batch size and the properties of the final minima, such as width or generalization, remains an open question. In order to tackle this problem we investigate the previously proposed approximation of SGD by a stochastic differential equation (SDE). We theoretically argue that three factors - learning rate, batch size and gradient covariance - influence the minima found by SGD. In particular we find that the ratio of","authors_text":"Amos Storkey, Asja Fischer, Devansh Arpit, Nicolas Ballas, Stanis{\\l}aw Jastrz\\k{e}bski, Yoshua Bengio, Zachary Kenton","cross_cats":["cs.AI","cs.CV","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-13T15:11:56Z","title":"Three Factors Influencing Minima in SGD"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.04623","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0cf2ca14dfbb6a8a567c89dbea99562ef2120338e18661863f3f37fa8abb78fe","target":"record","created_at":"2026-05-18T00:05:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"422ac8d1f82e758fbdde6344531805f5be3c1f9e9c312b760582b691292c8113","cross_cats_sorted":["cs.AI","cs.CV","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-13T15:11:56Z","title_canon_sha256":"8374a5494e65f1b9671443e920c94106ccb3751de54b7b0fb22be87c2beb9e16"},"schema_version":"1.0","source":{"id":"1711.04623","kind":"arxiv","version":3}},"canonical_sha256":"6742d89df4b181f61de51a850536adf4fdf7a8a9c65a8fd6111076b17f2d4ebe","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6742d89df4b181f61de51a850536adf4fdf7a8a9c65a8fd6111076b17f2d4ebe","first_computed_at":"2026-05-18T00:05:51.088069Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:05:51.088069Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"fP2OFxXEOBNgEQkyndIyq5a2KnNbadwB2qVlPEgvS5FTfw5x1r0BN1eB14cgl9ftHSWVnSqJCO8WdvyPxa4TDQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:05:51.088728Z","signed_message":"canonical_sha256_bytes"},"source_id":"1711.04623","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0cf2ca14dfbb6a8a567c89dbea99562ef2120338e18661863f3f37fa8abb78fe","sha256:67eb3f4c0fa3f7ba298c13b7516c477f486b5d5152ce6939d702d7503bfa57cf"],"state_sha256":"c504f5b774ac76d0bdabf608a3df03d6efd53674c19d512c5890df4c0407807e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6o+p7woZz5xDu+NkoQzPm9WVfO5/xPeg7HAa9rwcHPKD9xDNgr2KboqtXmVOO6VB38bAqrxLGvP3i/C9SnalBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T19:48:22.396575Z","bundle_sha256":"62ec571faca77c6ee00b9769549cdd2b4a578231f802c62140da7e3cc5aec66b"}}