{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:2CI4RNTTLJUJMMFTFUZFQK4VGL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7826d3094aa78640448452a7c38c91aab7daeaeb726494b1926558f85c462d9c","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-01T11:22:52Z","title_canon_sha256":"db77e3227669dc52abbd77cb6c5eaf2d5cba671c39523c9a8721188395620737"},"schema_version":"1.0","source":{"id":"1907.00664","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.00664","created_at":"2026-05-17T23:41:50Z"},{"alias_kind":"arxiv_version","alias_value":"1907.00664v1","created_at":"2026-05-17T23:41:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.00664","created_at":"2026-05-17T23:41:50Z"},{"alias_kind":"pith_short_12","alias_value":"2CI4RNTTLJUJ","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"2CI4RNTTLJUJMMFT","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"2CI4RNTT","created_at":"2026-05-18T12:33:07Z"}],"graph_snapshots":[{"event_id":"sha256:18d993e7df935139a3ee33ec46b832873ca7a1e9efe808020a1e0fe949ef90a9","target":"graph","created_at":"2026-05-17T23:41:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In many real-world scenarios, an autonomous agent often encounters various tasks within a single complex environment. We propose to build a graph abstraction over the environment structure to accelerate the learning of these tasks. Here, nodes are important points of interest (pivotal states) and edges represent feasible traversals between them. Our approach has two stages. First, we jointly train a latent pivotal state model and a curiosity-driven goal-conditioned policy in a task-agnostic manner. Second, provided with the information from the world graph, a high-level Manager quickly finds s","authors_text":"Alex Trott, Caiming Xiong, Richard Socher, Stephan Zheng, Wenling Shang","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-01T11:22:52Z","title":"Learning World Graphs to Accelerate Hierarchical Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.00664","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d03ec31ddcf0240295af5303481d37413f98a568d50021658a334056aac8465a","target":"record","created_at":"2026-05-17T23:41:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7826d3094aa78640448452a7c38c91aab7daeaeb726494b1926558f85c462d9c","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-07-01T11:22:52Z","title_canon_sha256":"db77e3227669dc52abbd77cb6c5eaf2d5cba671c39523c9a8721188395620737"},"schema_version":"1.0","source":{"id":"1907.00664","kind":"arxiv","version":1}},"canonical_sha256":"d091c8b6735a689630b32d32582b9532c107e8f3d79498bf0da721fb52c8ada5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d091c8b6735a689630b32d32582b9532c107e8f3d79498bf0da721fb52c8ada5","first_computed_at":"2026-05-17T23:41:50.856930Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:50.856930Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"C1lTip0uH0Txp1CTXV3Xd6b22UgtXwxEVLenxyWGT8fTtOjEBenTPXvX9YOuttG0qgbMzy4AG5USr1so9ktcAQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:50.857617Z","signed_message":"canonical_sha256_bytes"},"source_id":"1907.00664","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d03ec31ddcf0240295af5303481d37413f98a568d50021658a334056aac8465a","sha256:18d993e7df935139a3ee33ec46b832873ca7a1e9efe808020a1e0fe949ef90a9"],"state_sha256":"f35a44e7f9aacc39dd94c895b04cb51422489902754112620e7811a5afe38ae2"}