{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:6HCSNN7OV52M3VT4H4QSTUSBKD","short_pith_number":"pith:6HCSNN7O","canonical_record":{"source":{"id":"1907.02908","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-05T16:14:55Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"fba98bd15904f9fd04f034c12f00ede3a045f18ee17200801d106857f9085ce6","abstract_canon_sha256":"33d38104297957af69a114013ceb06b85c26f7a07fb1003ede6f5cfbf9b0df43"},"schema_version":"1.0"},"canonical_sha256":"f1c526b7eeaf74cdd67c3f2129d24150e6724308ee7f9737f859868d8f27b4c2","source":{"kind":"arxiv","id":"1907.02908","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.02908","created_at":"2026-05-17T23:41:22Z"},{"alias_kind":"arxiv_version","alias_value":"1907.02908v1","created_at":"2026-05-17T23:41:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.02908","created_at":"2026-05-17T23:41:22Z"},{"alias_kind":"pith_short_12","alias_value":"6HCSNN7OV52M","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_16","alias_value":"6HCSNN7OV52M3VT4","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_8","alias_value":"6HCSNN7O","created_at":"2026-05-18T12:33:10Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:6HCSNN7OV52M3VT4H4QSTUSBKD","target":"record","payload":{"canonical_record":{"source":{"id":"1907.02908","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-05T16:14:55Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"fba98bd15904f9fd04f034c12f00ede3a045f18ee17200801d106857f9085ce6","abstract_canon_sha256":"33d38104297957af69a114013ceb06b85c26f7a07fb1003ede6f5cfbf9b0df43"},"schema_version":"1.0"},"canonical_sha256":"f1c526b7eeaf74cdd67c3f2129d24150e6724308ee7f9737f859868d8f27b4c2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:22.640334Z","signature_b64":"bydHSIs/Dr5Oo76XcLOppWC8bpJmtuqzVTatc2ZvWyaL1WmIjw4n1uIgu2vwwcw/KGiY9XFltDKnEsn9IuW3Aw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f1c526b7eeaf74cdd67c3f2129d24150e6724308ee7f9737f859868d8f27b4c2","last_reissued_at":"2026-05-17T23:41:22.639669Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:22.639669Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1907.02908","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"iCoOmHJPlO04uKyhA9gzu9C0R322/V7DuDtT7bJqt/tajV7gtlrjbERSGFQNPSSYXR0jlZTUNypprLYhTr1rDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T17:10:29.738965Z"},"content_sha256":"ae5c5abcf2549a91bd9e6864efefc1b4852d314503a6ecdc20af0d551fb66ff9","schema_version":"1.0","event_id":"sha256:ae5c5abcf2549a91bd9e6864efefc1b4852d314503a6ecdc20af0d551fb66ff9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:6HCSNN7OV52M3VT4H4QSTUSBKD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"On Inductive Biases in Deep Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","stat.ML"],"primary_cat":"cs.LG","authors_text":"David Silver, Hado van Hasselt, Joseph Modayil, Matteo Hessel","submitted_at":"2019-07-05T16:14:55Z","abstract_excerpt":"Many deep reinforcement learning algorithms contain inductive biases that sculpt the agent's objective and its interface to the environment. These inductive biases can take many forms, including domain knowledge and pretuned hyper-parameters. In general, there is a trade-off between generality and performance when algorithms use such biases. Stronger biases can lead to faster learning, but weaker biases can potentially lead to more general algorithms. This trade-off is important because inductive biases are not free; substantial effort may be required to obtain relevant domain knowledge or to "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.02908","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:22Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1KGTc+f+AcRpaNmx3nOI0dVKN6JAGGEEwqWePt4UIYIqvVa+c0JxgOrTeTRUSYzBKU/dlUKY0kWHM4alYPvVBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T17:10:29.739648Z"},"content_sha256":"4c1e25b6d645d9af0aa16039c2419268183d80f2b41820d3c9b165c94a51ad83","schema_version":"1.0","event_id":"sha256:4c1e25b6d645d9af0aa16039c2419268183d80f2b41820d3c9b165c94a51ad83"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6HCSNN7OV52M3VT4H4QSTUSBKD/bundle.json","state_url":"https://pith.science/pith/6HCSNN7OV52M3VT4H4QSTUSBKD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6HCSNN7OV52M3VT4H4QSTUSBKD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T17:10:29Z","links":{"resolver":"https://pith.science/pith/6HCSNN7OV52M3VT4H4QSTUSBKD","bundle":"https://pith.science/pith/6HCSNN7OV52M3VT4H4QSTUSBKD/bundle.json","state":"https://pith.science/pith/6HCSNN7OV52M3VT4H4QSTUSBKD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6HCSNN7OV52M3VT4H4QSTUSBKD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:6HCSNN7OV52M3VT4H4QSTUSBKD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"33d38104297957af69a114013ceb06b85c26f7a07fb1003ede6f5cfbf9b0df43","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-05T16:14:55Z","title_canon_sha256":"fba98bd15904f9fd04f034c12f00ede3a045f18ee17200801d106857f9085ce6"},"schema_version":"1.0","source":{"id":"1907.02908","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.02908","created_at":"2026-05-17T23:41:22Z"},{"alias_kind":"arxiv_version","alias_value":"1907.02908v1","created_at":"2026-05-17T23:41:22Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.02908","created_at":"2026-05-17T23:41:22Z"},{"alias_kind":"pith_short_12","alias_value":"6HCSNN7OV52M","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_16","alias_value":"6HCSNN7OV52M3VT4","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_8","alias_value":"6HCSNN7O","created_at":"2026-05-18T12:33:10Z"}],"graph_snapshots":[{"event_id":"sha256:4c1e25b6d645d9af0aa16039c2419268183d80f2b41820d3c9b165c94a51ad83","target":"graph","created_at":"2026-05-17T23:41:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Many deep reinforcement learning algorithms contain inductive biases that sculpt the agent's objective and its interface to the environment. These inductive biases can take many forms, including domain knowledge and pretuned hyper-parameters. In general, there is a trade-off between generality and performance when algorithms use such biases. Stronger biases can lead to faster learning, but weaker biases can potentially lead to more general algorithms. This trade-off is important because inductive biases are not free; substantial effort may be required to obtain relevant domain knowledge or to ","authors_text":"David Silver, Hado van Hasselt, Joseph Modayil, Matteo Hessel","cross_cats":["cs.AI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-05T16:14:55Z","title":"On Inductive Biases in Deep Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.02908","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ae5c5abcf2549a91bd9e6864efefc1b4852d314503a6ecdc20af0d551fb66ff9","target":"record","created_at":"2026-05-17T23:41:22Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"33d38104297957af69a114013ceb06b85c26f7a07fb1003ede6f5cfbf9b0df43","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-05T16:14:55Z","title_canon_sha256":"fba98bd15904f9fd04f034c12f00ede3a045f18ee17200801d106857f9085ce6"},"schema_version":"1.0","source":{"id":"1907.02908","kind":"arxiv","version":1}},"canonical_sha256":"f1c526b7eeaf74cdd67c3f2129d24150e6724308ee7f9737f859868d8f27b4c2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f1c526b7eeaf74cdd67c3f2129d24150e6724308ee7f9737f859868d8f27b4c2","first_computed_at":"2026-05-17T23:41:22.639669Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:22.639669Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"bydHSIs/Dr5Oo76XcLOppWC8bpJmtuqzVTatc2ZvWyaL1WmIjw4n1uIgu2vwwcw/KGiY9XFltDKnEsn9IuW3Aw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:22.640334Z","signed_message":"canonical_sha256_bytes"},"source_id":"1907.02908","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ae5c5abcf2549a91bd9e6864efefc1b4852d314503a6ecdc20af0d551fb66ff9","sha256:4c1e25b6d645d9af0aa16039c2419268183d80f2b41820d3c9b165c94a51ad83"],"state_sha256":"a70df6ae0281be448628b7421cffe05e09044248be2930219c296252689222bd"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IZa51O/pDkweOYhnm9zeOHkHwhBIhsXllORhc1FDU62dwypVFIrL+sakEvz5ugwgsImWSlya/62hsqJiAuCxAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T17:10:29.743304Z","bundle_sha256":"9c57ef41063ab9efb51ced4f95c6877f5c407352182e9a0dd68caa3edf1caeaa"}}