{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:I74RDOL3ZLVX77XQHXPOZGMON2","short_pith_number":"pith:I74RDOL3","canonical_record":{"source":{"id":"1708.07227","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2017-08-24T00:20:16Z","cross_cats_sorted":[],"title_canon_sha256":"e1c2a11c8c238a266ccb0fbc68938cd62050514097ae6f0bb0bde8fa0a094a48","abstract_canon_sha256":"d3bc72e9e2c2cef82adc213110dc4ecf2b9d70c7382012ff708e9358ce6f1a8b"},"schema_version":"1.0"},"canonical_sha256":"47f911b97bcaeb7ffef03ddeec998e6ea407e5beb858e35f2a6836da74c85895","source":{"kind":"arxiv","id":"1708.07227","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.07227","created_at":"2026-05-18T00:36:46Z"},{"alias_kind":"arxiv_version","alias_value":"1708.07227v1","created_at":"2026-05-18T00:36:46Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.07227","created_at":"2026-05-18T00:36:46Z"},{"alias_kind":"pith_short_12","alias_value":"I74RDOL3ZLVX","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_16","alias_value":"I74RDOL3ZLVX77XQ","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_8","alias_value":"I74RDOL3","created_at":"2026-05-18T12:31:21Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:I74RDOL3ZLVX77XQHXPOZGMON2","target":"record","payload":{"canonical_record":{"source":{"id":"1708.07227","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2017-08-24T00:20:16Z","cross_cats_sorted":[],"title_canon_sha256":"e1c2a11c8c238a266ccb0fbc68938cd62050514097ae6f0bb0bde8fa0a094a48","abstract_canon_sha256":"d3bc72e9e2c2cef82adc213110dc4ecf2b9d70c7382012ff708e9358ce6f1a8b"},"schema_version":"1.0"},"canonical_sha256":"47f911b97bcaeb7ffef03ddeec998e6ea407e5beb858e35f2a6836da74c85895","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:36:46.858486Z","signature_b64":"S1el3XwN0mzFSAdc314/npk12JjCCFEKtxH0tsCnppGmCuAdeK0SGHB/8t8T+eS+5c91GSj6SXv3RqkEuw6RAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"47f911b97bcaeb7ffef03ddeec998e6ea407e5beb858e35f2a6836da74c85895","last_reissued_at":"2026-05-18T00:36:46.857965Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:36:46.857965Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1708.07227","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:36:46Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"PDsTVUdb7dR826J19OzwKAKuBDM7tQ2U4HblKZEagMZ+NegEgK4CZ+k962ziAFp9mfKt6yUewakWLYRfiBLtBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T03:44:59.094887Z"},"content_sha256":"f6031202c4ff41956f7dcef38a85fee0e5d2fc3f79a6bd2f4d168b6c7893d5b1","schema_version":"1.0","event_id":"sha256:f6031202c4ff41956f7dcef38a85fee0e5d2fc3f79a6bd2f4d168b6c7893d5b1"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:I74RDOL3ZLVX77XQHXPOZGMON2","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Proportionate gradient updates with PercentDelta","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Sami Abu-el-haija","submitted_at":"2017-08-24T00:20:16Z","abstract_excerpt":"Deep Neural Networks are generally trained using iterative gradient updates. Magnitudes of gradients are affected by many factors, including choice of activation functions and initialization. More importantly, gradient magnitudes can greatly differ across layers, with some layers receiving much smaller gradients than others. causing some layers to train slower than others and therefore slowing down the overall convergence. We analytically explain this disproportionality. Then we propose to explicitly train all layers at the same speed, by scaling the gradient w.r.t. every trainable tensor to b"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.07227","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:36:46Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/gLcbFxjLl8d3z+ardGq8g70aw10RbDWc0j21RtGSid6HdeuxES7QYKh7stRcg17m0igw446VX4285iWqZnsDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T03:44:59.095234Z"},"content_sha256":"c077222e4c499a30a495159899aee07e306cb872983acbe793a64e046741dc73","schema_version":"1.0","event_id":"sha256:c077222e4c499a30a495159899aee07e306cb872983acbe793a64e046741dc73"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/I74RDOL3ZLVX77XQHXPOZGMON2/bundle.json","state_url":"https://pith.science/pith/I74RDOL3ZLVX77XQHXPOZGMON2/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/I74RDOL3ZLVX77XQHXPOZGMON2/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-12T03:44:59Z","links":{"resolver":"https://pith.science/pith/I74RDOL3ZLVX77XQHXPOZGMON2","bundle":"https://pith.science/pith/I74RDOL3ZLVX77XQHXPOZGMON2/bundle.json","state":"https://pith.science/pith/I74RDOL3ZLVX77XQHXPOZGMON2/state.json","well_known_bundle":"https://pith.science/.well-known/pith/I74RDOL3ZLVX77XQHXPOZGMON2/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:I74RDOL3ZLVX77XQHXPOZGMON2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d3bc72e9e2c2cef82adc213110dc4ecf2b9d70c7382012ff708e9358ce6f1a8b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2017-08-24T00:20:16Z","title_canon_sha256":"e1c2a11c8c238a266ccb0fbc68938cd62050514097ae6f0bb0bde8fa0a094a48"},"schema_version":"1.0","source":{"id":"1708.07227","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.07227","created_at":"2026-05-18T00:36:46Z"},{"alias_kind":"arxiv_version","alias_value":"1708.07227v1","created_at":"2026-05-18T00:36:46Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.07227","created_at":"2026-05-18T00:36:46Z"},{"alias_kind":"pith_short_12","alias_value":"I74RDOL3ZLVX","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_16","alias_value":"I74RDOL3ZLVX77XQ","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_8","alias_value":"I74RDOL3","created_at":"2026-05-18T12:31:21Z"}],"graph_snapshots":[{"event_id":"sha256:c077222e4c499a30a495159899aee07e306cb872983acbe793a64e046741dc73","target":"graph","created_at":"2026-05-18T00:36:46Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Deep Neural Networks are generally trained using iterative gradient updates. Magnitudes of gradients are affected by many factors, including choice of activation functions and initialization. More importantly, gradient magnitudes can greatly differ across layers, with some layers receiving much smaller gradients than others. causing some layers to train slower than others and therefore slowing down the overall convergence. We analytically explain this disproportionality. Then we propose to explicitly train all layers at the same speed, by scaling the gradient w.r.t. every trainable tensor to b","authors_text":"Sami Abu-el-haija","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2017-08-24T00:20:16Z","title":"Proportionate gradient updates with PercentDelta"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.07227","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f6031202c4ff41956f7dcef38a85fee0e5d2fc3f79a6bd2f4d168b6c7893d5b1","target":"record","created_at":"2026-05-18T00:36:46Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d3bc72e9e2c2cef82adc213110dc4ecf2b9d70c7382012ff708e9358ce6f1a8b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2017-08-24T00:20:16Z","title_canon_sha256":"e1c2a11c8c238a266ccb0fbc68938cd62050514097ae6f0bb0bde8fa0a094a48"},"schema_version":"1.0","source":{"id":"1708.07227","kind":"arxiv","version":1}},"canonical_sha256":"47f911b97bcaeb7ffef03ddeec998e6ea407e5beb858e35f2a6836da74c85895","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"47f911b97bcaeb7ffef03ddeec998e6ea407e5beb858e35f2a6836da74c85895","first_computed_at":"2026-05-18T00:36:46.857965Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:36:46.857965Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"S1el3XwN0mzFSAdc314/npk12JjCCFEKtxH0tsCnppGmCuAdeK0SGHB/8t8T+eS+5c91GSj6SXv3RqkEuw6RAg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:36:46.858486Z","signed_message":"canonical_sha256_bytes"},"source_id":"1708.07227","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f6031202c4ff41956f7dcef38a85fee0e5d2fc3f79a6bd2f4d168b6c7893d5b1","sha256:c077222e4c499a30a495159899aee07e306cb872983acbe793a64e046741dc73"],"state_sha256":"c99130f5ca42f6e1f0ed52fd6f0c4d2cc28736293747d81541c4a488105f9ea3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"K7pWJnIk+48ef5wbruRTiqQZ8UphdXGfnUpJD94w5NdYVhWsAkJC0zRjWcEuSpgfN3ZOBX76fZXe7gmOeW6oAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-12T03:44:59.097291Z","bundle_sha256":"a8d1fad7dc3ec936e14cc30fc17e69b91e8495e461671bd5ae9fcb59f4ff3292"}}