{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:TZLVYBSYR4EEM5CIH6CEN2CEXQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"901076f7ef9569cb9acf2994b54d2d494940530c233a6c717fb35537dd0067bc","cross_cats_sorted":["cs.AI","cs.RO","stat.AP","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-22T05:54:27Z","title_canon_sha256":"a50a392564bf40f34fcd0df29a758dedf86b45b419b1c9412c9bb2ba999dbdd2"},"schema_version":"1.0","source":{"id":"1903.09366","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.09366","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"arxiv_version","alias_value":"1903.09366v2","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.09366","created_at":"2026-05-17T23:44:21Z"},{"alias_kind":"pith_short_12","alias_value":"TZLVYBSYR4EE","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"TZLVYBSYR4EEM5CI","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"TZLVYBSY","created_at":"2026-05-18T12:33:30Z"}],"graph_snapshots":[{"event_id":"sha256:92b01f1d392ed33a5d5c66691a45b16cd5c5bab1d29a8d48ce75913a9a3a4dcb","target":"graph","created_at":"2026-05-17T23:44:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"One problem in the application of reinforcement learning to real-world problems is the curse of dimensionality on the action space. Macro actions, a sequence of primitive actions, have been studied to diminish the dimensionality of the action space with regard to the time axis. However, previous studies relied on humans defining macro actions or assumed macro actions as repetitions of the same primitive actions. We present Factorized Macro Action Reinforcement Learning (FaMARL) which autonomously learns disentangled factor representation of a sequence of actions to generate macro actions that ","authors_text":"Heecheol Kim, Hiroshi Yamakawa, Kosuke Miyoshi, Masanori Yamada","cross_cats":["cs.AI","cs.RO","stat.AP","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-22T05:54:27Z","title":"Macro Action Reinforcement Learning with Sequence Disentanglement using Variational Autoencoder"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.09366","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a0081603317449272791f16b4f11ee587ae2c557f161591f5e4d8072c5089c6f","target":"record","created_at":"2026-05-17T23:44:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"901076f7ef9569cb9acf2994b54d2d494940530c233a6c717fb35537dd0067bc","cross_cats_sorted":["cs.AI","cs.RO","stat.AP","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-03-22T05:54:27Z","title_canon_sha256":"a50a392564bf40f34fcd0df29a758dedf86b45b419b1c9412c9bb2ba999dbdd2"},"schema_version":"1.0","source":{"id":"1903.09366","kind":"arxiv","version":2}},"canonical_sha256":"9e575c06588f084674483f8446e844bc00c23eb2f0dbd5f57fd75e21970f0c8b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9e575c06588f084674483f8446e844bc00c23eb2f0dbd5f57fd75e21970f0c8b","first_computed_at":"2026-05-17T23:44:21.418452Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:44:21.418452Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"FLmoky48kBMhuVNenR+8oBYdVx7maBjl0tZVbG3cTHEZZUV+FTOhKEUCbhPhVTlQHVm0uZW/uZBNk2L5+00QAQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:44:21.419010Z","signed_message":"canonical_sha256_bytes"},"source_id":"1903.09366","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a0081603317449272791f16b4f11ee587ae2c557f161591f5e4d8072c5089c6f","sha256:92b01f1d392ed33a5d5c66691a45b16cd5c5bab1d29a8d48ce75913a9a3a4dcb"],"state_sha256":"1b3fdaddcb32d7867cb1c9d9d748fca9777b2169a4436b2696db197a78aebc44"}