{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:GXIRMJ6UERXKJTI42UPLHRGKNF","short_pith_number":"pith:GXIRMJ6U","canonical_record":{"source":{"id":"1901.08486","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-24T16:26:16Z","cross_cats_sorted":["cs.AI","cs.CV"],"title_canon_sha256":"33a3198c5aaef2aa796590631e33cf4b33b9ab2be141d813ef8f0298923f3f44","abstract_canon_sha256":"a9234216d8fadf71c219a85b8c7b3099db26681c8339c299292d7c1316cf8182"},"schema_version":"1.0"},"canonical_sha256":"35d11627d4246ea4cd1cd51eb3c4ca69543ae6842859a9fe3d3a9b258d247b13","source":{"kind":"arxiv","id":"1901.08486","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.08486","created_at":"2026-05-17T23:55:35Z"},{"alias_kind":"arxiv_version","alias_value":"1901.08486v1","created_at":"2026-05-17T23:55:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.08486","created_at":"2026-05-17T23:55:35Z"},{"alias_kind":"pith_short_12","alias_value":"GXIRMJ6UERXK","created_at":"2026-05-18T12:33:18Z"},{"alias_kind":"pith_short_16","alias_value":"GXIRMJ6UERXKJTI4","created_at":"2026-05-18T12:33:18Z"},{"alias_kind":"pith_short_8","alias_value":"GXIRMJ6U","created_at":"2026-05-18T12:33:18Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:GXIRMJ6UERXKJTI42UPLHRGKNF","target":"record","payload":{"canonical_record":{"source":{"id":"1901.08486","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-24T16:26:16Z","cross_cats_sorted":["cs.AI","cs.CV"],"title_canon_sha256":"33a3198c5aaef2aa796590631e33cf4b33b9ab2be141d813ef8f0298923f3f44","abstract_canon_sha256":"a9234216d8fadf71c219a85b8c7b3099db26681c8339c299292d7c1316cf8182"},"schema_version":"1.0"},"canonical_sha256":"35d11627d4246ea4cd1cd51eb3c4ca69543ae6842859a9fe3d3a9b258d247b13","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:55:35.345012Z","signature_b64":"HBf/cuD6+WUMVdBrcG12eLkPGlxrPruKZ2JcT1eOCseewxBuddHNiDBdmCiihveAqbvG3pvhcgPGejjWtk1dBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"35d11627d4246ea4cd1cd51eb3c4ca69543ae6842859a9fe3d3a9b258d247b13","last_reissued_at":"2026-05-17T23:55:35.344411Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:55:35.344411Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1901.08486","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:55:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2uN1v7fNkSsOd1SdvbtwHQA2GyQjgD3uJjpPjekBR4smpZA2Aj9IDq6KN8IU+yoG1a9uoJc333pwB8k3G7/MCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T13:58:32.304072Z"},"content_sha256":"14c0ec1f8cb28ad63381eaae0ab1757f86f1157c5d25d8649d42d0f4aa592e88","schema_version":"1.0","event_id":"sha256:14c0ec1f8cb28ad63381eaae0ab1757f86f1157c5d25d8649d42d0f4aa592e88"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:GXIRMJ6UERXKJTI42UPLHRGKNF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Never Forget: Balancing Exploration and Exploitation via Learning Optical Flow","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CV"],"primary_cat":"cs.LG","authors_text":"Chun-Yi Lee, Hsuan-Kung Yang, Kuan-Wei Ho, Min-Fong Hong, Po-Han Chiang","submitted_at":"2019-01-24T16:26:16Z","abstract_excerpt":"Exploration bonus derived from the novelty of the states in an environment has become a popular approach to motivate exploration for deep reinforcement learning agents in the past few years. Recent methods such as curiosity-driven exploration usually estimate the novelty of new observations by the prediction errors of their system dynamics models. Due to the capacity limitation of the models and difficulty of performing next-frame prediction, however, these methods typically fail to balance between exploration and exploitation in high-dimensional observation tasks, resulting in the agents forg"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.08486","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:55:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"I2lzt4G/cYiZww4g+r8dBAEEp0YJ8xFbhZVBjh6nKakfFFNKJJBT+1BrDKtqUzV1Ndu1riW1YCmkSnBMrm88Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T13:58:32.304561Z"},"content_sha256":"ab1062453bdb4b05bac9d7f69c19668c5267431fdde1ec48f0fb80e6ab175673","schema_version":"1.0","event_id":"sha256:ab1062453bdb4b05bac9d7f69c19668c5267431fdde1ec48f0fb80e6ab175673"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/GXIRMJ6UERXKJTI42UPLHRGKNF/bundle.json","state_url":"https://pith.science/pith/GXIRMJ6UERXKJTI42UPLHRGKNF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/GXIRMJ6UERXKJTI42UPLHRGKNF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T13:58:32Z","links":{"resolver":"https://pith.science/pith/GXIRMJ6UERXKJTI42UPLHRGKNF","bundle":"https://pith.science/pith/GXIRMJ6UERXKJTI42UPLHRGKNF/bundle.json","state":"https://pith.science/pith/GXIRMJ6UERXKJTI42UPLHRGKNF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/GXIRMJ6UERXKJTI42UPLHRGKNF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:GXIRMJ6UERXKJTI42UPLHRGKNF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a9234216d8fadf71c219a85b8c7b3099db26681c8339c299292d7c1316cf8182","cross_cats_sorted":["cs.AI","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-24T16:26:16Z","title_canon_sha256":"33a3198c5aaef2aa796590631e33cf4b33b9ab2be141d813ef8f0298923f3f44"},"schema_version":"1.0","source":{"id":"1901.08486","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.08486","created_at":"2026-05-17T23:55:35Z"},{"alias_kind":"arxiv_version","alias_value":"1901.08486v1","created_at":"2026-05-17T23:55:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.08486","created_at":"2026-05-17T23:55:35Z"},{"alias_kind":"pith_short_12","alias_value":"GXIRMJ6UERXK","created_at":"2026-05-18T12:33:18Z"},{"alias_kind":"pith_short_16","alias_value":"GXIRMJ6UERXKJTI4","created_at":"2026-05-18T12:33:18Z"},{"alias_kind":"pith_short_8","alias_value":"GXIRMJ6U","created_at":"2026-05-18T12:33:18Z"}],"graph_snapshots":[{"event_id":"sha256:ab1062453bdb4b05bac9d7f69c19668c5267431fdde1ec48f0fb80e6ab175673","target":"graph","created_at":"2026-05-17T23:55:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Exploration bonus derived from the novelty of the states in an environment has become a popular approach to motivate exploration for deep reinforcement learning agents in the past few years. Recent methods such as curiosity-driven exploration usually estimate the novelty of new observations by the prediction errors of their system dynamics models. Due to the capacity limitation of the models and difficulty of performing next-frame prediction, however, these methods typically fail to balance between exploration and exploitation in high-dimensional observation tasks, resulting in the agents forg","authors_text":"Chun-Yi Lee, Hsuan-Kung Yang, Kuan-Wei Ho, Min-Fong Hong, Po-Han Chiang","cross_cats":["cs.AI","cs.CV"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-24T16:26:16Z","title":"Never Forget: Balancing Exploration and Exploitation via Learning Optical Flow"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.08486","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:14c0ec1f8cb28ad63381eaae0ab1757f86f1157c5d25d8649d42d0f4aa592e88","target":"record","created_at":"2026-05-17T23:55:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a9234216d8fadf71c219a85b8c7b3099db26681c8339c299292d7c1316cf8182","cross_cats_sorted":["cs.AI","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-24T16:26:16Z","title_canon_sha256":"33a3198c5aaef2aa796590631e33cf4b33b9ab2be141d813ef8f0298923f3f44"},"schema_version":"1.0","source":{"id":"1901.08486","kind":"arxiv","version":1}},"canonical_sha256":"35d11627d4246ea4cd1cd51eb3c4ca69543ae6842859a9fe3d3a9b258d247b13","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"35d11627d4246ea4cd1cd51eb3c4ca69543ae6842859a9fe3d3a9b258d247b13","first_computed_at":"2026-05-17T23:55:35.344411Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:55:35.344411Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"HBf/cuD6+WUMVdBrcG12eLkPGlxrPruKZ2JcT1eOCseewxBuddHNiDBdmCiihveAqbvG3pvhcgPGejjWtk1dBw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:55:35.345012Z","signed_message":"canonical_sha256_bytes"},"source_id":"1901.08486","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:14c0ec1f8cb28ad63381eaae0ab1757f86f1157c5d25d8649d42d0f4aa592e88","sha256:ab1062453bdb4b05bac9d7f69c19668c5267431fdde1ec48f0fb80e6ab175673"],"state_sha256":"4afc646df329bc4b474c8d0e591ee3a00f404e0909a4fa4f5063d35f4e136169"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"szkt0YrelClOYtRjv3EM34SclX2kiiuB4CjqNsZ5iIxNsz9/etT3ArBMSv3I7j/xeTviwhIUN+7yOoWnVhIsBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T13:58:32.307283Z","bundle_sha256":"5f2ec449bd1b0509dfba6e26db9335eca488058c94179a48bba808f3e129103e"}}