{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:6DFKPMMQUA7GP4KK5K7REXH4IU","short_pith_number":"pith:6DFKPMMQ","canonical_record":{"source":{"id":"1811.10779","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-27T02:37:03Z","cross_cats_sorted":[],"title_canon_sha256":"21334485c10c3275276ad653b5eed50889a410a6d686027623f818e809d377b1","abstract_canon_sha256":"46c13d09618021ce34e3f18170197e5ef0393e8b6ca3fd079f37e6cad54077bd"},"schema_version":"1.0"},"canonical_sha256":"f0caa7b190a03e67f14aeabf125cfc451e05e4e5bb77c79700bd33ae49ae647e","source":{"kind":"arxiv","id":"1811.10779","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.10779","created_at":"2026-05-17T23:59:47Z"},{"alias_kind":"arxiv_version","alias_value":"1811.10779v1","created_at":"2026-05-17T23:59:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.10779","created_at":"2026-05-17T23:59:47Z"},{"alias_kind":"pith_short_12","alias_value":"6DFKPMMQUA7G","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_16","alias_value":"6DFKPMMQUA7GP4KK","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_8","alias_value":"6DFKPMMQ","created_at":"2026-05-18T12:32:08Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:6DFKPMMQUA7GP4KK5K7REXH4IU","target":"record","payload":{"canonical_record":{"source":{"id":"1811.10779","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-27T02:37:03Z","cross_cats_sorted":[],"title_canon_sha256":"21334485c10c3275276ad653b5eed50889a410a6d686027623f818e809d377b1","abstract_canon_sha256":"46c13d09618021ce34e3f18170197e5ef0393e8b6ca3fd079f37e6cad54077bd"},"schema_version":"1.0"},"canonical_sha256":"f0caa7b190a03e67f14aeabf125cfc451e05e4e5bb77c79700bd33ae49ae647e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:59:47.553788Z","signature_b64":"JYn48/yy1fdm5cZQD2AHx34ILQYrHKKuwmYXs7xsceveNsYzJ7Mfgi95t6EF/HAyzq2634an+BAy2pZWBMLgBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f0caa7b190a03e67f14aeabf125cfc451e05e4e5bb77c79700bd33ae49ae647e","last_reissued_at":"2026-05-17T23:59:47.553376Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:59:47.553376Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1811.10779","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"LeIbBzoX69UU+7e9CpeJTY1sNpNjFM3A6O+nXxzc0MoFSjV1s0bI5NArMgQ+L+Lf0Wk9SOCt6cIoRtJdVzPBCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T19:22:50.308339Z"},"content_sha256":"7f2f4c4f5d6e1ff1840392f197755ed0b21fd41a49a2f5ac659f63c0eafe2fc3","schema_version":"1.0","event_id":"sha256:7f2f4c4f5d6e1ff1840392f197755ed0b21fd41a49a2f5ac659f63c0eafe2fc3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:6DFKPMMQUA7GP4KK5K7REXH4IU","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Tackling Early Sparse Gradients in Softmax Activation Using Leaky Squared Euclidean Distance","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Rujie Liu, Wei Shen","submitted_at":"2018-11-27T02:37:03Z","abstract_excerpt":"Softmax activation is commonly used to output the probability distribution over categories based on certain distance metric. In scenarios like one-shot learning, the distance metric is often chosen to be squared Euclidean distance between the query sample and the category prototype. This practice works well in most time. However, we find that choosing squared Euclidean distance may cause distance explosion leading gradients to be extremely sparse in the early stage of back propagation. We term this phenomena as the early sparse gradients problem. Though it doesn't deteriorate the convergence o"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.10779","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"S702brHZow3sXG0FbH3rp6aLgVrEjLCKQt2iXEYXCg7TilCrWMF4mfinCt0byhZrSWXtHD2T3fC9+dXeWuy5BA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T19:22:50.308690Z"},"content_sha256":"35cdd95010a4b8b74e6712477c092c6ea15725e52ba0eb2b3787d7bd69671bf9","schema_version":"1.0","event_id":"sha256:35cdd95010a4b8b74e6712477c092c6ea15725e52ba0eb2b3787d7bd69671bf9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6DFKPMMQUA7GP4KK5K7REXH4IU/bundle.json","state_url":"https://pith.science/pith/6DFKPMMQUA7GP4KK5K7REXH4IU/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6DFKPMMQUA7GP4KK5K7REXH4IU/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T19:22:50Z","links":{"resolver":"https://pith.science/pith/6DFKPMMQUA7GP4KK5K7REXH4IU","bundle":"https://pith.science/pith/6DFKPMMQUA7GP4KK5K7REXH4IU/bundle.json","state":"https://pith.science/pith/6DFKPMMQUA7GP4KK5K7REXH4IU/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6DFKPMMQUA7GP4KK5K7REXH4IU/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:6DFKPMMQUA7GP4KK5K7REXH4IU","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"46c13d09618021ce34e3f18170197e5ef0393e8b6ca3fd079f37e6cad54077bd","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-27T02:37:03Z","title_canon_sha256":"21334485c10c3275276ad653b5eed50889a410a6d686027623f818e809d377b1"},"schema_version":"1.0","source":{"id":"1811.10779","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.10779","created_at":"2026-05-17T23:59:47Z"},{"alias_kind":"arxiv_version","alias_value":"1811.10779v1","created_at":"2026-05-17T23:59:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.10779","created_at":"2026-05-17T23:59:47Z"},{"alias_kind":"pith_short_12","alias_value":"6DFKPMMQUA7G","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_16","alias_value":"6DFKPMMQUA7GP4KK","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_8","alias_value":"6DFKPMMQ","created_at":"2026-05-18T12:32:08Z"}],"graph_snapshots":[{"event_id":"sha256:35cdd95010a4b8b74e6712477c092c6ea15725e52ba0eb2b3787d7bd69671bf9","target":"graph","created_at":"2026-05-17T23:59:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Softmax activation is commonly used to output the probability distribution over categories based on certain distance metric. In scenarios like one-shot learning, the distance metric is often chosen to be squared Euclidean distance between the query sample and the category prototype. This practice works well in most time. However, we find that choosing squared Euclidean distance may cause distance explosion leading gradients to be extremely sparse in the early stage of back propagation. We term this phenomena as the early sparse gradients problem. Though it doesn't deteriorate the convergence o","authors_text":"Rujie Liu, Wei Shen","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-27T02:37:03Z","title":"Tackling Early Sparse Gradients in Softmax Activation Using Leaky Squared Euclidean Distance"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.10779","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7f2f4c4f5d6e1ff1840392f197755ed0b21fd41a49a2f5ac659f63c0eafe2fc3","target":"record","created_at":"2026-05-17T23:59:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"46c13d09618021ce34e3f18170197e5ef0393e8b6ca3fd079f37e6cad54077bd","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-27T02:37:03Z","title_canon_sha256":"21334485c10c3275276ad653b5eed50889a410a6d686027623f818e809d377b1"},"schema_version":"1.0","source":{"id":"1811.10779","kind":"arxiv","version":1}},"canonical_sha256":"f0caa7b190a03e67f14aeabf125cfc451e05e4e5bb77c79700bd33ae49ae647e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f0caa7b190a03e67f14aeabf125cfc451e05e4e5bb77c79700bd33ae49ae647e","first_computed_at":"2026-05-17T23:59:47.553376Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:59:47.553376Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"JYn48/yy1fdm5cZQD2AHx34ILQYrHKKuwmYXs7xsceveNsYzJ7Mfgi95t6EF/HAyzq2634an+BAy2pZWBMLgBw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:59:47.553788Z","signed_message":"canonical_sha256_bytes"},"source_id":"1811.10779","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7f2f4c4f5d6e1ff1840392f197755ed0b21fd41a49a2f5ac659f63c0eafe2fc3","sha256:35cdd95010a4b8b74e6712477c092c6ea15725e52ba0eb2b3787d7bd69671bf9"],"state_sha256":"139c4ebdef113b1b6086a944bfe791f807de345ddc42316ec087247954bb269e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Ra9K+sbzcM+HcF0Ck/QUsBz3PIFosr71Sr+uIouW5n0W4dDi3mSqPQ7iYK+fhKyaOnI67IZEC6m53soIWWBOBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T19:22:50.310664Z","bundle_sha256":"1b8bc5fb853b6c6356ac8228567f7df01caeb9737bc9b92f0d2b46d4f316c1d8"}}