{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:RRZMC7BJCP2ZP5NNK4HHGDNXDW","short_pith_number":"pith:RRZMC7BJ","canonical_record":{"source":{"id":"1901.01492","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-01-06T03:15:15Z","cross_cats_sorted":[],"title_canon_sha256":"5741c1be1c9cd3b838693ce5c2193b13a0b7f58c74896c49cda3c223c68937f0","abstract_canon_sha256":"9519dc239e29055c5b5b1d5556259c5d50e9ded0a883a717840347d5ce60c0ac"},"schema_version":"1.0"},"canonical_sha256":"8c72c17c2913f597f5ad570e730db71dabb847a7ce0649a848cc0560f997d649","source":{"kind":"arxiv","id":"1901.01492","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.01492","created_at":"2026-05-17T23:56:51Z"},{"alias_kind":"arxiv_version","alias_value":"1901.01492v1","created_at":"2026-05-17T23:56:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.01492","created_at":"2026-05-17T23:56:51Z"},{"alias_kind":"pith_short_12","alias_value":"RRZMC7BJCP2Z","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"RRZMC7BJCP2ZP5NN","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"RRZMC7BJ","created_at":"2026-05-18T12:33:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:RRZMC7BJCP2ZP5NNK4HHGDNXDW","target":"record","payload":{"canonical_record":{"source":{"id":"1901.01492","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-01-06T03:15:15Z","cross_cats_sorted":[],"title_canon_sha256":"5741c1be1c9cd3b838693ce5c2193b13a0b7f58c74896c49cda3c223c68937f0","abstract_canon_sha256":"9519dc239e29055c5b5b1d5556259c5d50e9ded0a883a717840347d5ce60c0ac"},"schema_version":"1.0"},"canonical_sha256":"8c72c17c2913f597f5ad570e730db71dabb847a7ce0649a848cc0560f997d649","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:56:51.876599Z","signature_b64":"GmBu26HgZrFVTjblmbz+pyxKU/rjVC6OtXs6AMF8PAtvPb5YsQxazPFpcYKa1x6TR35NClOS7JIHqHcUzH9ECg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8c72c17c2913f597f5ad570e730db71dabb847a7ce0649a848cc0560f997d649","last_reissued_at":"2026-05-17T23:56:51.876186Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:56:51.876186Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1901.01492","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"eUzYzyUGTTEZIEKQ3m+Ao0LpExNe7K4LLGwedim6y147X13wtm4St7HeLYYzMfAt+XS9AfdQ30sSyu8LSJg7Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T23:33:46.530820Z"},"content_sha256":"424981931f4fa6f5b95acbc85d98fb041f5dc1cd3242b8645bde2910cb0a8d17","schema_version":"1.0","event_id":"sha256:424981931f4fa6f5b95acbc85d98fb041f5dc1cd3242b8645bde2910cb0a8d17"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:RRZMC7BJCP2ZP5NNK4HHGDNXDW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"What Should I Do Now? Marrying Reinforcement Learning and Symbolic Planning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Ali Farhadi, Daniel Gordon, Dieter Fox","submitted_at":"2019-01-06T03:15:15Z","abstract_excerpt":"Long-term planning poses a major difficulty to many reinforcement learning algorithms. This problem becomes even more pronounced in dynamic visual environments. In this work we propose Hierarchical Planning and Reinforcement Learning (HIP-RL), a method for merging the benefits and capabilities of Symbolic Planning with the learning abilities of Deep Reinforcement Learning. We apply HIPRL to the complex visual tasks of interactive question answering and visual semantic planning and achieve state-of-the-art results on three challenging datasets all while taking fewer steps at test time and train"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.01492","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9Bz29WnO+x/KZ4tc099Z7FalL33c7bGGoPBbXMgP+ZYnnhcSkiphEF88EVeQGuvIFJeiioZe+vx55mYO8KidBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T23:33:46.531593Z"},"content_sha256":"d9b8286842d52af272418d8608f70e7e187a639805ad36dfee0d26c56fd48fc0","schema_version":"1.0","event_id":"sha256:d9b8286842d52af272418d8608f70e7e187a639805ad36dfee0d26c56fd48fc0"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RRZMC7BJCP2ZP5NNK4HHGDNXDW/bundle.json","state_url":"https://pith.science/pith/RRZMC7BJCP2ZP5NNK4HHGDNXDW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RRZMC7BJCP2ZP5NNK4HHGDNXDW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-11T23:33:46Z","links":{"resolver":"https://pith.science/pith/RRZMC7BJCP2ZP5NNK4HHGDNXDW","bundle":"https://pith.science/pith/RRZMC7BJCP2ZP5NNK4HHGDNXDW/bundle.json","state":"https://pith.science/pith/RRZMC7BJCP2ZP5NNK4HHGDNXDW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RRZMC7BJCP2ZP5NNK4HHGDNXDW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:RRZMC7BJCP2ZP5NNK4HHGDNXDW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9519dc239e29055c5b5b1d5556259c5d50e9ded0a883a717840347d5ce60c0ac","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-01-06T03:15:15Z","title_canon_sha256":"5741c1be1c9cd3b838693ce5c2193b13a0b7f58c74896c49cda3c223c68937f0"},"schema_version":"1.0","source":{"id":"1901.01492","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.01492","created_at":"2026-05-17T23:56:51Z"},{"alias_kind":"arxiv_version","alias_value":"1901.01492v1","created_at":"2026-05-17T23:56:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.01492","created_at":"2026-05-17T23:56:51Z"},{"alias_kind":"pith_short_12","alias_value":"RRZMC7BJCP2Z","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"RRZMC7BJCP2ZP5NN","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"RRZMC7BJ","created_at":"2026-05-18T12:33:27Z"}],"graph_snapshots":[{"event_id":"sha256:d9b8286842d52af272418d8608f70e7e187a639805ad36dfee0d26c56fd48fc0","target":"graph","created_at":"2026-05-17T23:56:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Long-term planning poses a major difficulty to many reinforcement learning algorithms. This problem becomes even more pronounced in dynamic visual environments. In this work we propose Hierarchical Planning and Reinforcement Learning (HIP-RL), a method for merging the benefits and capabilities of Symbolic Planning with the learning abilities of Deep Reinforcement Learning. We apply HIPRL to the complex visual tasks of interactive question answering and visual semantic planning and achieve state-of-the-art results on three challenging datasets all while taking fewer steps at test time and train","authors_text":"Ali Farhadi, Daniel Gordon, Dieter Fox","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-01-06T03:15:15Z","title":"What Should I Do Now? Marrying Reinforcement Learning and Symbolic Planning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.01492","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:424981931f4fa6f5b95acbc85d98fb041f5dc1cd3242b8645bde2910cb0a8d17","target":"record","created_at":"2026-05-17T23:56:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9519dc239e29055c5b5b1d5556259c5d50e9ded0a883a717840347d5ce60c0ac","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-01-06T03:15:15Z","title_canon_sha256":"5741c1be1c9cd3b838693ce5c2193b13a0b7f58c74896c49cda3c223c68937f0"},"schema_version":"1.0","source":{"id":"1901.01492","kind":"arxiv","version":1}},"canonical_sha256":"8c72c17c2913f597f5ad570e730db71dabb847a7ce0649a848cc0560f997d649","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8c72c17c2913f597f5ad570e730db71dabb847a7ce0649a848cc0560f997d649","first_computed_at":"2026-05-17T23:56:51.876186Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:56:51.876186Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"GmBu26HgZrFVTjblmbz+pyxKU/rjVC6OtXs6AMF8PAtvPb5YsQxazPFpcYKa1x6TR35NClOS7JIHqHcUzH9ECg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:56:51.876599Z","signed_message":"canonical_sha256_bytes"},"source_id":"1901.01492","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:424981931f4fa6f5b95acbc85d98fb041f5dc1cd3242b8645bde2910cb0a8d17","sha256:d9b8286842d52af272418d8608f70e7e187a639805ad36dfee0d26c56fd48fc0"],"state_sha256":"32c569cf0ef3af3c7473d044c28205fae064116abdd2cb48a182b1b95e07c3c1"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"bZh1pHm5yGd/FfWwojKlSNVUQvWMz6pvJdlMcTKnRYlaIVCxXKxeN0RDEhT5wSnBm1AzC//7eHRqn/+09VqKAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-11T23:33:46.535770Z","bundle_sha256":"6030b50d930f1f17eb1bf9f01bc2ed24c0b1526918fe793dac71bb7bd4d34e15"}}