{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:N3VEWPOEBNXSVZXVISOPZLGISU","short_pith_number":"pith:N3VEWPOE","canonical_record":{"source":{"id":"1607.00446","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2016-07-02T01:33:00Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"0f57fbaae635827dd50b316ccafa614a4412537f1f339ea0b18da1868d728533","abstract_canon_sha256":"c86d123082c7b02b53a7b2d60e90f290a76279404273c8a3cc0dd6f67c9c4cdc"},"schema_version":"1.0"},"canonical_sha256":"6eea4b3dc40b6f2ae6f5449cfcacc89528d40dff2dea5f63402b4dc65fc92519","source":{"kind":"arxiv","id":"1607.00446","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1607.00446","created_at":"2026-05-18T01:01:30Z"},{"alias_kind":"arxiv_version","alias_value":"1607.00446v2","created_at":"2026-05-18T01:01:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1607.00446","created_at":"2026-05-18T01:01:30Z"},{"alias_kind":"pith_short_12","alias_value":"N3VEWPOEBNXS","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_16","alias_value":"N3VEWPOEBNXSVZXV","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_8","alias_value":"N3VEWPOE","created_at":"2026-05-18T12:30:32Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:N3VEWPOEBNXSVZXVISOPZLGISU","target":"record","payload":{"canonical_record":{"source":{"id":"1607.00446","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2016-07-02T01:33:00Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"0f57fbaae635827dd50b316ccafa614a4412537f1f339ea0b18da1868d728533","abstract_canon_sha256":"c86d123082c7b02b53a7b2d60e90f290a76279404273c8a3cc0dd6f67c9c4cdc"},"schema_version":"1.0"},"canonical_sha256":"6eea4b3dc40b6f2ae6f5449cfcacc89528d40dff2dea5f63402b4dc65fc92519","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:01:30.976956Z","signature_b64":"lya0934ehlwmUWUpocVTc6KO/pdeBuS8r5fpAoAFnTeB04RqdTeOuoU8QVM4BHiVZGkOoW1utjBm7SjcRYoMCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6eea4b3dc40b6f2ae6f5449cfcacc89528d40dff2dea5f63402b4dc65fc92519","last_reissued_at":"2026-05-18T01:01:30.976498Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:01:30.976498Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1607.00446","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:01:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jAiRBp0WryhJMI3Z+zTr0uAGFT+4MXk/iDXdXfh9bm+eIKeKbnh6hirhQFysm595tilVFJIh+eOHRQLhACB3Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T02:21:52.356704Z"},"content_sha256":"7b8680c8a19f5a14c9f7f86249f1dd5bf0880c8051aa93e32155a204cc50b04e","schema_version":"1.0","event_id":"sha256:7b8680c8a19f5a14c9f7f86249f1dd5bf0880c8051aa93e32155a204cc50b04e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:N3VEWPOEBNXSVZXVISOPZLGISU","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Greedy Approach to Adapting the Trace Parameter for Temporal Difference Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","stat.ML"],"primary_cat":"cs.AI","authors_text":"Adam White, Martha White","submitted_at":"2016-07-02T01:33:00Z","abstract_excerpt":"One of the main obstacles to broad application of reinforcement learning methods is the parameter sensitivity of our core learning algorithms. In many large-scale applications, online computation and function approximation represent key strategies in scaling up reinforcement learning algorithms. In this setting, we have effective and reasonably well understood algorithms for adapting the learning-rate parameter, online during learning. Such meta-learning approaches can improve robustness of learning and enable specialization to current task, improving learning speed. For temporal-difference le"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1607.00446","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:01:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KbEd8o/bacs6CVnl9A0Zb8HXwDyTt909nMDZkQbOc4AXHV7yjJMdavb1EODgQYQZH4jKNV9aihFbO6+v7saMBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T02:21:52.357330Z"},"content_sha256":"29de8e567f3c2e98e7292ad8a5d428457ffbe53693f895eb3fa68d6bb35541e9","schema_version":"1.0","event_id":"sha256:29de8e567f3c2e98e7292ad8a5d428457ffbe53693f895eb3fa68d6bb35541e9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/N3VEWPOEBNXSVZXVISOPZLGISU/bundle.json","state_url":"https://pith.science/pith/N3VEWPOEBNXSVZXVISOPZLGISU/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/N3VEWPOEBNXSVZXVISOPZLGISU/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T02:21:52Z","links":{"resolver":"https://pith.science/pith/N3VEWPOEBNXSVZXVISOPZLGISU","bundle":"https://pith.science/pith/N3VEWPOEBNXSVZXVISOPZLGISU/bundle.json","state":"https://pith.science/pith/N3VEWPOEBNXSVZXVISOPZLGISU/state.json","well_known_bundle":"https://pith.science/.well-known/pith/N3VEWPOEBNXSVZXVISOPZLGISU/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:N3VEWPOEBNXSVZXVISOPZLGISU","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c86d123082c7b02b53a7b2d60e90f290a76279404273c8a3cc0dd6f67c9c4cdc","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2016-07-02T01:33:00Z","title_canon_sha256":"0f57fbaae635827dd50b316ccafa614a4412537f1f339ea0b18da1868d728533"},"schema_version":"1.0","source":{"id":"1607.00446","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1607.00446","created_at":"2026-05-18T01:01:30Z"},{"alias_kind":"arxiv_version","alias_value":"1607.00446v2","created_at":"2026-05-18T01:01:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1607.00446","created_at":"2026-05-18T01:01:30Z"},{"alias_kind":"pith_short_12","alias_value":"N3VEWPOEBNXS","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_16","alias_value":"N3VEWPOEBNXSVZXV","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_8","alias_value":"N3VEWPOE","created_at":"2026-05-18T12:30:32Z"}],"graph_snapshots":[{"event_id":"sha256:29de8e567f3c2e98e7292ad8a5d428457ffbe53693f895eb3fa68d6bb35541e9","target":"graph","created_at":"2026-05-18T01:01:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"One of the main obstacles to broad application of reinforcement learning methods is the parameter sensitivity of our core learning algorithms. In many large-scale applications, online computation and function approximation represent key strategies in scaling up reinforcement learning algorithms. In this setting, we have effective and reasonably well understood algorithms for adapting the learning-rate parameter, online during learning. Such meta-learning approaches can improve robustness of learning and enable specialization to current task, improving learning speed. For temporal-difference le","authors_text":"Adam White, Martha White","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2016-07-02T01:33:00Z","title":"A Greedy Approach to Adapting the Trace Parameter for Temporal Difference Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1607.00446","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7b8680c8a19f5a14c9f7f86249f1dd5bf0880c8051aa93e32155a204cc50b04e","target":"record","created_at":"2026-05-18T01:01:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c86d123082c7b02b53a7b2d60e90f290a76279404273c8a3cc0dd6f67c9c4cdc","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2016-07-02T01:33:00Z","title_canon_sha256":"0f57fbaae635827dd50b316ccafa614a4412537f1f339ea0b18da1868d728533"},"schema_version":"1.0","source":{"id":"1607.00446","kind":"arxiv","version":2}},"canonical_sha256":"6eea4b3dc40b6f2ae6f5449cfcacc89528d40dff2dea5f63402b4dc65fc92519","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6eea4b3dc40b6f2ae6f5449cfcacc89528d40dff2dea5f63402b4dc65fc92519","first_computed_at":"2026-05-18T01:01:30.976498Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:01:30.976498Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"lya0934ehlwmUWUpocVTc6KO/pdeBuS8r5fpAoAFnTeB04RqdTeOuoU8QVM4BHiVZGkOoW1utjBm7SjcRYoMCw==","signature_status":"signed_v1","signed_at":"2026-05-18T01:01:30.976956Z","signed_message":"canonical_sha256_bytes"},"source_id":"1607.00446","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7b8680c8a19f5a14c9f7f86249f1dd5bf0880c8051aa93e32155a204cc50b04e","sha256:29de8e567f3c2e98e7292ad8a5d428457ffbe53693f895eb3fa68d6bb35541e9"],"state_sha256":"c92a9c77e2030202bb679dbcbac3fed5fb212659b029b1c103259a4a09601ad3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kdzwmHPb4BIQ8xsACTNh3daYTbUdXgIp/G8msjp7XbJjdsJHMGzLnWmI4ItByh+Q7+j0bxqFE86f0wAGtMDhBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T02:21:52.360457Z","bundle_sha256":"5ac4d80ebbf2865e59c6009f1b6e2e52e98c14aea3f1ffd54fafa4bffde0c3ea"}}