{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:MU5JKQEJCENCRJM6BCYFGFLD65","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"41760e9b61d6e1eb7518890762c0a5eeec810ed0742c14f3dbe57cef817de718","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-12-29T08:57:02Z","title_canon_sha256":"fdd458b593496cac04e71177b881d767eac31df95e8cc983585f4aa538f6fa69"},"schema_version":"1.0","source":{"id":"1912.12612","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1912.12612","created_at":"2026-07-05T00:29:01Z"},{"alias_kind":"arxiv_version","alias_value":"1912.12612v1","created_at":"2026-07-05T00:29:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1912.12612","created_at":"2026-07-05T00:29:01Z"},{"alias_kind":"pith_short_12","alias_value":"MU5JKQEJCENC","created_at":"2026-07-05T00:29:01Z"},{"alias_kind":"pith_short_16","alias_value":"MU5JKQEJCENCRJM6","created_at":"2026-07-05T00:29:01Z"},{"alias_kind":"pith_short_8","alias_value":"MU5JKQEJ","created_at":"2026-07-05T00:29:01Z"}],"graph_snapshots":[{"event_id":"sha256:0a9896f01d1bb78578f9ad8c16ca37af3b03b20d4c972c29b8e714300bd703a1","target":"graph","created_at":"2026-07-05T00:29:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/1912.12612/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Autonomous agents can learn by imitating teacher demonstrations of the intended behavior. Hierarchical control policies are ubiquitously useful for such learning, having the potential to break down structured tasks into simpler sub-tasks, thereby improving data efficiency and generalization. In this paper, we propose a variational inference method for imitation learning of a control policy represented by parametrized hierarchical procedures (PHP), a program-like structure in which procedures can invoke sub-procedures to perform sub-tasks. Our method discovers the hierarchical structure in a da","authors_text":"Dawn Song, Ion Stoica, Ken Goldberg, Pieter Abbeel, Richard Shin, Roy Fox, William Paul, Yitian Zou","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-12-29T08:57:02Z","title":"Hierarchical Variational Imitation Learning of Control Programs"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1912.12612","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8134ec3c38be037f0505ce81b9f52f794482b1ccb970ba65dd0be8790fb0aa2e","target":"record","created_at":"2026-07-05T00:29:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"41760e9b61d6e1eb7518890762c0a5eeec810ed0742c14f3dbe57cef817de718","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-12-29T08:57:02Z","title_canon_sha256":"fdd458b593496cac04e71177b881d767eac31df95e8cc983585f4aa538f6fa69"},"schema_version":"1.0","source":{"id":"1912.12612","kind":"arxiv","version":1}},"canonical_sha256":"653a954089111a28a59e08b0531563f740a34abe0ce16584d455315775b1d556","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"653a954089111a28a59e08b0531563f740a34abe0ce16584d455315775b1d556","first_computed_at":"2026-07-05T00:29:01.786353Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T00:29:01.786353Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"wvvNcah+ve7423E6x0otjGrPK2IDAZXfd6PJNu435iWmnJ+kkVIOC38iJA2ggCYZ6Di0F7nifL1v9jJNrxSrBw==","signature_status":"signed_v1","signed_at":"2026-07-05T00:29:01.786828Z","signed_message":"canonical_sha256_bytes"},"source_id":"1912.12612","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8134ec3c38be037f0505ce81b9f52f794482b1ccb970ba65dd0be8790fb0aa2e","sha256:0a9896f01d1bb78578f9ad8c16ca37af3b03b20d4c972c29b8e714300bd703a1"],"state_sha256":"4d961a7026e9c4e872b76ea5ef4feabe75a5cd726e4f7abe61e5768579acc97a"}