{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:3SCQQOUES7WBX7LCMUQF6FBI2E","short_pith_number":"pith:3SCQQOUE","canonical_record":{"source":{"id":"1803.01905","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-03-05T20:03:46Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"5eee7faf2b42553d55a8a63a80b129d7ca3aa44b46fedb0f577b9fc044960a16","abstract_canon_sha256":"24e91961e359120410ccffc0aaf28e6ede0facb96d2458cd2b12e63e7f6a7444"},"schema_version":"1.0"},"canonical_sha256":"dc85083a8497ec1bfd6265205f1428d12b64ebaaf5627026e244a86f322f9c56","source":{"kind":"arxiv","id":"1803.01905","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.01905","created_at":"2026-05-17T23:50:38Z"},{"alias_kind":"arxiv_version","alias_value":"1803.01905v3","created_at":"2026-05-17T23:50:38Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.01905","created_at":"2026-05-17T23:50:38Z"},{"alias_kind":"pith_short_12","alias_value":"3SCQQOUES7WB","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"3SCQQOUES7WBX7LC","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"3SCQQOUE","created_at":"2026-05-18T12:32:05Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:3SCQQOUES7WBX7LCMUQF6FBI2E","target":"record","payload":{"canonical_record":{"source":{"id":"1803.01905","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-03-05T20:03:46Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"5eee7faf2b42553d55a8a63a80b129d7ca3aa44b46fedb0f577b9fc044960a16","abstract_canon_sha256":"24e91961e359120410ccffc0aaf28e6ede0facb96d2458cd2b12e63e7f6a7444"},"schema_version":"1.0"},"canonical_sha256":"dc85083a8497ec1bfd6265205f1428d12b64ebaaf5627026e244a86f322f9c56","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:50:38.736679Z","signature_b64":"qwN70J/ZdKsmA3iNJlNKLHiBpU1bRmmPqwH9sxzUTl4IZPfZmeDxdLXPkSl5JtZO2d7hd5bu5rExoKTdiPLoBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"dc85083a8497ec1bfd6265205f1428d12b64ebaaf5627026e244a86f322f9c56","last_reissued_at":"2026-05-17T23:50:38.736241Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:50:38.736241Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1803.01905","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:50:38Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G1v4MQ1dR/P4uXI0wnRoJy3TUlDmJ3P6xNDtyaZfRPjD1jXl+QiooNJK3/LLO9QnQgZXvEvn6SJMFBv1bSJCDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T03:14:33.425579Z"},"content_sha256":"1998dd191addc26f9270baf452dc5ef14f6fe442f5c750077dcc0535fde4f72b","schema_version":"1.0","event_id":"sha256:1998dd191addc26f9270baf452dc5ef14f6fe442f5c750077dcc0535fde4f72b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:3SCQQOUES7WBX7LCMUQF6FBI2E","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Convergence of Gradient Descent on Separable Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"stat.ML","authors_text":"Daniel Soudry, Jason D. Lee, Mor Shpigel Nacson, Nathan Srebro, Pedro H. P. Savarese, Suriya Gunasekar","submitted_at":"2018-03-05T20:03:46Z","abstract_excerpt":"We provide a detailed study on the implicit bias of gradient descent when optimizing loss functions with strictly monotone tails, such as the logistic loss, over separable datasets. We look at two basic questions: (a) what are the conditions on the tail of the loss function under which gradient descent converges in the direction of the $L_2$ maximum-margin separator? (b) how does the rate of margin convergence depend on the tail of the loss function and the choice of the step size? We show that for a large family of super-polynomial tailed losses, gradient descent iterates on linear networks o"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.01905","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:50:38Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/TdfY8jj62lL2VpW8ub+N4Y4b/ld0/TYa5d20in28VhBRuS8ECt8vacDCY28NypmfzNg/DWdAx47D+0e29lqAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T03:14:33.426223Z"},"content_sha256":"04d416cc5d1f76ad4eb45f12f578d60064c5c06f22d9f6e59462f9d4c78fdbef","schema_version":"1.0","event_id":"sha256:04d416cc5d1f76ad4eb45f12f578d60064c5c06f22d9f6e59462f9d4c78fdbef"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3SCQQOUES7WBX7LCMUQF6FBI2E/bundle.json","state_url":"https://pith.science/pith/3SCQQOUES7WBX7LCMUQF6FBI2E/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3SCQQOUES7WBX7LCMUQF6FBI2E/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T03:14:33Z","links":{"resolver":"https://pith.science/pith/3SCQQOUES7WBX7LCMUQF6FBI2E","bundle":"https://pith.science/pith/3SCQQOUES7WBX7LCMUQF6FBI2E/bundle.json","state":"https://pith.science/pith/3SCQQOUES7WBX7LCMUQF6FBI2E/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3SCQQOUES7WBX7LCMUQF6FBI2E/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:3SCQQOUES7WBX7LCMUQF6FBI2E","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"24e91961e359120410ccffc0aaf28e6ede0facb96d2458cd2b12e63e7f6a7444","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-03-05T20:03:46Z","title_canon_sha256":"5eee7faf2b42553d55a8a63a80b129d7ca3aa44b46fedb0f577b9fc044960a16"},"schema_version":"1.0","source":{"id":"1803.01905","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.01905","created_at":"2026-05-17T23:50:38Z"},{"alias_kind":"arxiv_version","alias_value":"1803.01905v3","created_at":"2026-05-17T23:50:38Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.01905","created_at":"2026-05-17T23:50:38Z"},{"alias_kind":"pith_short_12","alias_value":"3SCQQOUES7WB","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"3SCQQOUES7WBX7LC","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"3SCQQOUE","created_at":"2026-05-18T12:32:05Z"}],"graph_snapshots":[{"event_id":"sha256:04d416cc5d1f76ad4eb45f12f578d60064c5c06f22d9f6e59462f9d4c78fdbef","target":"graph","created_at":"2026-05-17T23:50:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We provide a detailed study on the implicit bias of gradient descent when optimizing loss functions with strictly monotone tails, such as the logistic loss, over separable datasets. We look at two basic questions: (a) what are the conditions on the tail of the loss function under which gradient descent converges in the direction of the $L_2$ maximum-margin separator? (b) how does the rate of margin convergence depend on the tail of the loss function and the choice of the step size? We show that for a large family of super-polynomial tailed losses, gradient descent iterates on linear networks o","authors_text":"Daniel Soudry, Jason D. Lee, Mor Shpigel Nacson, Nathan Srebro, Pedro H. P. Savarese, Suriya Gunasekar","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-03-05T20:03:46Z","title":"Convergence of Gradient Descent on Separable Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.01905","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1998dd191addc26f9270baf452dc5ef14f6fe442f5c750077dcc0535fde4f72b","target":"record","created_at":"2026-05-17T23:50:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"24e91961e359120410ccffc0aaf28e6ede0facb96d2458cd2b12e63e7f6a7444","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-03-05T20:03:46Z","title_canon_sha256":"5eee7faf2b42553d55a8a63a80b129d7ca3aa44b46fedb0f577b9fc044960a16"},"schema_version":"1.0","source":{"id":"1803.01905","kind":"arxiv","version":3}},"canonical_sha256":"dc85083a8497ec1bfd6265205f1428d12b64ebaaf5627026e244a86f322f9c56","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"dc85083a8497ec1bfd6265205f1428d12b64ebaaf5627026e244a86f322f9c56","first_computed_at":"2026-05-17T23:50:38.736241Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:50:38.736241Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"qwN70J/ZdKsmA3iNJlNKLHiBpU1bRmmPqwH9sxzUTl4IZPfZmeDxdLXPkSl5JtZO2d7hd5bu5rExoKTdiPLoBg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:50:38.736679Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.01905","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1998dd191addc26f9270baf452dc5ef14f6fe442f5c750077dcc0535fde4f72b","sha256:04d416cc5d1f76ad4eb45f12f578d60064c5c06f22d9f6e59462f9d4c78fdbef"],"state_sha256":"a28a073835b0fa735782dd7df19958534aadba09fb6feab1c180b62770e58a30"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5pzyRwgUz+H0S0GnPrOWN3U3qEwvGLIQkJ9Qdy4+jITsKVvZi2QK+dyazqaYOVOKzhxbY/svqXRdOZ2gQk7EAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T03:14:33.429513Z","bundle_sha256":"52bcd7d69761934bfd35073c488a0edc5d27ac8ac6431198ae41ec9230b81684"}}