{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:EDJTSMWDP76D4VR3WN6SV473B3","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3b6dde410f295dbce759ce3c13c610a8112d13827e3c16c28d3f76d8d90e95dd","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-23T20:06:26Z","title_canon_sha256":"0be0804235a0e4456838e6a8df500a9db702bd3d62e17d14362aec303ff0282f"},"schema_version":"1.0","source":{"id":"2509.19538","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2509.19538","created_at":"2026-05-18T03:09:34Z"},{"alias_kind":"arxiv_version","alias_value":"2509.19538v2","created_at":"2026-05-18T03:09:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2509.19538","created_at":"2026-05-18T03:09:34Z"},{"alias_kind":"pith_short_12","alias_value":"EDJTSMWDP76D","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"EDJTSMWDP76D4VR3","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"EDJTSMWD","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:4bbdc62ef3c795b90bd72703b9b6053b4e3938a4c72e45c6a0182d2ac9c0ff7d","target":"graph","created_at":"2026-05-18T03:09:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Diffusion-based world models have demonstrated strong capabilities in synthesizing realistic long-horizon trajectories for offline reinforcement learning (RL). However, many existing methods do not directly generate actions alongside states and rewards, limiting their compatibility with standard value-based offline RL algorithms that rely on one-step temporal difference (TD) learning. While prior work has explored joint modeling of states, rewards, and actions to address this issue, such formulations often lead to increased training complexity and reduced performance in practice. We propose \\t","authors_text":"Matthias Schubert, Niklas Strauss, Xiao Han, Yusong Li, Zongyue Li","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-23T20:06:26Z","title":"DAWM: Diffusion Action World Models for Offline Reinforcement Learning via Action-Inferred Transitions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2509.19538","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:086f747d8ffadcbe3e9496c075857cee4579d4991935e1a0c984b5f0a78cbe33","target":"record","created_at":"2026-05-18T03:09:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3b6dde410f295dbce759ce3c13c610a8112d13827e3c16c28d3f76d8d90e95dd","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-23T20:06:26Z","title_canon_sha256":"0be0804235a0e4456838e6a8df500a9db702bd3d62e17d14362aec303ff0282f"},"schema_version":"1.0","source":{"id":"2509.19538","kind":"arxiv","version":2}},"canonical_sha256":"20d33932c37ffc3e563bb37d2af3fb0ec54089319661a0c4008407e4d78ce03c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"20d33932c37ffc3e563bb37d2af3fb0ec54089319661a0c4008407e4d78ce03c","first_computed_at":"2026-05-18T03:09:34.567039Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T03:09:34.567039Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"BQYWDr+SLQ75rRHQuNd89MZKUsJa1ioTmgdXuGyzdSrupUgnNWOog/A4dlDJBvr3Z7xSiItn0ukZ7bE7tSHhAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T03:09:34.567863Z","signed_message":"canonical_sha256_bytes"},"source_id":"2509.19538","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:086f747d8ffadcbe3e9496c075857cee4579d4991935e1a0c984b5f0a78cbe33","sha256:4bbdc62ef3c795b90bd72703b9b6053b4e3938a4c72e45c6a0182d2ac9c0ff7d"],"state_sha256":"c87c71abd23234a2ce97cd99f9a8a28f77088c1886e6c5f96776987cd7f224d7"}