{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:P5FZCUYMCBYOWFTX4NSSEMNIGE","short_pith_number":"pith:P5FZCUYM","canonical_record":{"source":{"id":"1705.11159","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-05-31T15:58:35Z","cross_cats_sorted":[],"title_canon_sha256":"5290540a0ea2c0cba39a4dcf07248ac2d8f5ebe2647a69e55466bb052ba28c4e","abstract_canon_sha256":"7900ed35c572c60742e69a816bcccfe468a936912b0e22b73aba8b66da5cd657"},"schema_version":"1.0"},"canonical_sha256":"7f4b91530c1070eb1677e3652231a8312f8b877f80a6e18348198fb54e4d9c87","source":{"kind":"arxiv","id":"1705.11159","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.11159","created_at":"2026-05-18T00:43:19Z"},{"alias_kind":"arxiv_version","alias_value":"1705.11159v1","created_at":"2026-05-18T00:43:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.11159","created_at":"2026-05-18T00:43:19Z"},{"alias_kind":"pith_short_12","alias_value":"P5FZCUYMCBYO","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_16","alias_value":"P5FZCUYMCBYOWFTX","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_8","alias_value":"P5FZCUYM","created_at":"2026-05-18T12:31:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:P5FZCUYMCBYOWFTX4NSSEMNIGE","target":"record","payload":{"canonical_record":{"source":{"id":"1705.11159","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-05-31T15:58:35Z","cross_cats_sorted":[],"title_canon_sha256":"5290540a0ea2c0cba39a4dcf07248ac2d8f5ebe2647a69e55466bb052ba28c4e","abstract_canon_sha256":"7900ed35c572c60742e69a816bcccfe468a936912b0e22b73aba8b66da5cd657"},"schema_version":"1.0"},"canonical_sha256":"7f4b91530c1070eb1677e3652231a8312f8b877f80a6e18348198fb54e4d9c87","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:43:19.087962Z","signature_b64":"nrS426mC3pVk99JZPhe129IO1IGnDdBnSThR6erf2+j7KTME0zCcfBMMGx/D3rtwuhtlvAF+38d1tGVC9f3CBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7f4b91530c1070eb1677e3652231a8312f8b877f80a6e18348198fb54e4d9c87","last_reissued_at":"2026-05-18T00:43:19.087339Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:43:19.087339Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1705.11159","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:43:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"f8Nl+AWOXifLKnx/BucwW0ICrqvoviYWVY0wmB67X7DkaaUZmQ5QmyOPaBvirGr6NtmOVVkylZmMJRmQS1/OCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-20T00:46:27.490392Z"},"content_sha256":"e69d941e82f0356ac1ec8f9734dc08b1551aac9d9e3c0e5594165369d5cbfc37","schema_version":"1.0","event_id":"sha256:e69d941e82f0356ac1ec8f9734dc08b1551aac9d9e3c0e5594165369d5cbfc37"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:P5FZCUYMCBYOWFTX4NSSEMNIGE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Reinforcement Learning for Learning Rate Control","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Chang Xu, Gang Wang, Tao Qin, Tie-Yan Liu","submitted_at":"2017-05-31T15:58:35Z","abstract_excerpt":"Stochastic gradient descent (SGD), which updates the model parameters by adding a local gradient times a learning rate at each step, is widely used in model training of machine learning algorithms such as neural networks. It is observed that the models trained by SGD are sensitive to learning rates and good learning rates are problem specific. We propose an algorithm to automatically learn learning rates using neural network based actor-critic methods from deep reinforcement learning (RL).In particular, we train a policy network called actor to decide the learning rate at each step during trai"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.11159","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:43:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Aa3nAmtJDTNMcjn3dFH3MzsPFEsjrVobDFowhu5cE1pPqyYwCzFFGYLmMWHii0czhBHcBKXQlDX1Bi4f7JjEDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-20T00:46:27.491196Z"},"content_sha256":"450b30eeed4903845471ca7d66ab91fb2ef3789ec39e67fe9f7c576ae45f3234","schema_version":"1.0","event_id":"sha256:450b30eeed4903845471ca7d66ab91fb2ef3789ec39e67fe9f7c576ae45f3234"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/P5FZCUYMCBYOWFTX4NSSEMNIGE/bundle.json","state_url":"https://pith.science/pith/P5FZCUYMCBYOWFTX4NSSEMNIGE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/P5FZCUYMCBYOWFTX4NSSEMNIGE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-20T00:46:27Z","links":{"resolver":"https://pith.science/pith/P5FZCUYMCBYOWFTX4NSSEMNIGE","bundle":"https://pith.science/pith/P5FZCUYMCBYOWFTX4NSSEMNIGE/bundle.json","state":"https://pith.science/pith/P5FZCUYMCBYOWFTX4NSSEMNIGE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/P5FZCUYMCBYOWFTX4NSSEMNIGE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:P5FZCUYMCBYOWFTX4NSSEMNIGE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7900ed35c572c60742e69a816bcccfe468a936912b0e22b73aba8b66da5cd657","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-05-31T15:58:35Z","title_canon_sha256":"5290540a0ea2c0cba39a4dcf07248ac2d8f5ebe2647a69e55466bb052ba28c4e"},"schema_version":"1.0","source":{"id":"1705.11159","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.11159","created_at":"2026-05-18T00:43:19Z"},{"alias_kind":"arxiv_version","alias_value":"1705.11159v1","created_at":"2026-05-18T00:43:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.11159","created_at":"2026-05-18T00:43:19Z"},{"alias_kind":"pith_short_12","alias_value":"P5FZCUYMCBYO","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_16","alias_value":"P5FZCUYMCBYOWFTX","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_8","alias_value":"P5FZCUYM","created_at":"2026-05-18T12:31:37Z"}],"graph_snapshots":[{"event_id":"sha256:450b30eeed4903845471ca7d66ab91fb2ef3789ec39e67fe9f7c576ae45f3234","target":"graph","created_at":"2026-05-18T00:43:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Stochastic gradient descent (SGD), which updates the model parameters by adding a local gradient times a learning rate at each step, is widely used in model training of machine learning algorithms such as neural networks. It is observed that the models trained by SGD are sensitive to learning rates and good learning rates are problem specific. We propose an algorithm to automatically learn learning rates using neural network based actor-critic methods from deep reinforcement learning (RL).In particular, we train a policy network called actor to decide the learning rate at each step during trai","authors_text":"Chang Xu, Gang Wang, Tao Qin, Tie-Yan Liu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-05-31T15:58:35Z","title":"Reinforcement Learning for Learning Rate Control"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.11159","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e69d941e82f0356ac1ec8f9734dc08b1551aac9d9e3c0e5594165369d5cbfc37","target":"record","created_at":"2026-05-18T00:43:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7900ed35c572c60742e69a816bcccfe468a936912b0e22b73aba8b66da5cd657","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-05-31T15:58:35Z","title_canon_sha256":"5290540a0ea2c0cba39a4dcf07248ac2d8f5ebe2647a69e55466bb052ba28c4e"},"schema_version":"1.0","source":{"id":"1705.11159","kind":"arxiv","version":1}},"canonical_sha256":"7f4b91530c1070eb1677e3652231a8312f8b877f80a6e18348198fb54e4d9c87","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7f4b91530c1070eb1677e3652231a8312f8b877f80a6e18348198fb54e4d9c87","first_computed_at":"2026-05-18T00:43:19.087339Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:43:19.087339Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"nrS426mC3pVk99JZPhe129IO1IGnDdBnSThR6erf2+j7KTME0zCcfBMMGx/D3rtwuhtlvAF+38d1tGVC9f3CBw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:43:19.087962Z","signed_message":"canonical_sha256_bytes"},"source_id":"1705.11159","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e69d941e82f0356ac1ec8f9734dc08b1551aac9d9e3c0e5594165369d5cbfc37","sha256:450b30eeed4903845471ca7d66ab91fb2ef3789ec39e67fe9f7c576ae45f3234"],"state_sha256":"804b59c2f28cbdfd330b3804b452f07d59b80c27653d2a9c0bbb04f98508f99d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"y6Qa3rnTmBSx8h9ZczqIWomKy/ZTMwFqP6xsoSSi9otyxZtX7RhMy3elEfJ0wKiE3rKO0DlvpLHfqpa7CyWVBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-20T00:46:27.496525Z","bundle_sha256":"392831a353c71198e6c244187f3d443ce6a7ea21c2092343d9fa87eb5091477d"}}