{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:TT6PQIZK2HMTWBOA63ZDO45GIC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b6739d71293402f339a4ede3658e893c055b4ac4fd9a7f239715d3e04817509e","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-16T17:49:43Z","title_canon_sha256":"8f018f575e63341a17212bcd1ff6d1c84a1dfc4674aab737706ac47fa8cf836f"},"schema_version":"1.0","source":{"id":"1810.07167","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.07167","created_at":"2026-05-18T00:03:10Z"},{"alias_kind":"arxiv_version","alias_value":"1810.07167v1","created_at":"2026-05-18T00:03:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.07167","created_at":"2026-05-18T00:03:10Z"},{"alias_kind":"pith_short_12","alias_value":"TT6PQIZK2HMT","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_16","alias_value":"TT6PQIZK2HMTWBOA","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_8","alias_value":"TT6PQIZK","created_at":"2026-05-18T12:32:56Z"}],"graph_snapshots":[{"event_id":"sha256:142ba3912a6d9bfce76557e3bf9ac6f3157b7d51f65a11340d92ecb97782377f","target":"graph","created_at":"2026-05-18T00:03:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"A general-purpose intelligent robot must be able to learn autonomously and be able to accomplish multiple tasks in order to be deployed in the real world. However, standard reinforcement learning approaches learn separate task-specific policies and assume the reward function for each task is known a priori. We propose a framework that learns event cues from off-policy data, and can flexibly combine these event cues at test time to accomplish different tasks. These event cue labels are not assumed to be known a priori, but are instead labeled using learned models, such as computer vision detect","authors_text":"Adam Villaflor, Gregory Kahn, Pieter Abbeel, Sergey Levine","cross_cats":["cs.AI","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-16T17:49:43Z","title":"Composable Action-Conditioned Predictors: Flexible Off-Policy Learning for Robot Navigation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.07167","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0282cb48acec6682308d8fce01e15f8774448786ce63a2e38edf5ddea30e4277","target":"record","created_at":"2026-05-18T00:03:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b6739d71293402f339a4ede3658e893c055b4ac4fd9a7f239715d3e04817509e","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-16T17:49:43Z","title_canon_sha256":"8f018f575e63341a17212bcd1ff6d1c84a1dfc4674aab737706ac47fa8cf836f"},"schema_version":"1.0","source":{"id":"1810.07167","kind":"arxiv","version":1}},"canonical_sha256":"9cfcf8232ad1d93b05c0f6f23773a6408137942f6073692a44101f8f28268de7","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9cfcf8232ad1d93b05c0f6f23773a6408137942f6073692a44101f8f28268de7","first_computed_at":"2026-05-18T00:03:10.220948Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:03:10.220948Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"LTBHT0BgyEyKG9wHLz/aGBQQr1E1EYbBtcG6m+XLjahCO7Q2Y2WwibM72zA6YJ8JyCNlOkPMhsebOW8GtgE0CQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:03:10.221608Z","signed_message":"canonical_sha256_bytes"},"source_id":"1810.07167","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0282cb48acec6682308d8fce01e15f8774448786ce63a2e38edf5ddea30e4277","sha256:142ba3912a6d9bfce76557e3bf9ac6f3157b7d51f65a11340d92ecb97782377f"],"state_sha256":"b1e3042038a76e1a25ef66f080a2a7989eaec9d82329139bf4287581d714d3b3"}