{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:HIFZOUBYL4MUBAYGMKOMOTLEEI","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"765f81f3d2d88b75734567382a6d76edc3ef5105afa9150b81e87305503a5f8f","cross_cats_sorted":["cs.AI","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-03-03T11:59:03Z","title_canon_sha256":"c87b3b7402a0b036065ca13d8145b89f1d9a32e7381b9b3d878dafc51b0db253"},"schema_version":"1.0","source":{"id":"2503.01450","kind":"arxiv","version":7}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2503.01450","created_at":"2026-05-28T01:04:27Z"},{"alias_kind":"arxiv_version","alias_value":"2503.01450v7","created_at":"2026-05-28T01:04:27Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2503.01450","created_at":"2026-05-28T01:04:27Z"},{"alias_kind":"pith_short_12","alias_value":"HIFZOUBYL4MU","created_at":"2026-05-28T01:04:27Z"},{"alias_kind":"pith_short_16","alias_value":"HIFZOUBYL4MUBAYG","created_at":"2026-05-28T01:04:27Z"},{"alias_kind":"pith_short_8","alias_value":"HIFZOUBY","created_at":"2026-05-28T01:04:27Z"}],"graph_snapshots":[{"event_id":"sha256:56575f0d2df67f22de5bb1d985f88d1be56e068e956d0598af310aedfb8482b0","target":"graph","created_at":"2026-05-28T01:04:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2503.01450/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"How should we analyze memory in deep RL? We introduce tools for analyzing policies under partial observability and revealing how agents use memory to make decisions. To utilize these tools, we present POPGym Arcade, a collection of Atari-inspired, hardware-accelerated environments sharing a single observation and action space. Each environment provides fully and partially observable variants, enabling counterfactual studies on observability. We find that controlled studies are necessary for fair comparisons and identify a pathology where value functions smear credit over irrelevant history. Us","authors_text":"Borong Zhang, Edan Toledo, Steven Morad, Zekang Wang, Zhe He","cross_cats":["cs.AI","cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-03-03T11:59:03Z","title":"Investigating Memory in Model-Free RL with POPGym Arcade"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2503.01450","kind":"arxiv","version":7},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8a390320ca49bba45d9859b0537989d824ed124547237225811c74894f88a1a2","target":"record","created_at":"2026-05-28T01:04:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"765f81f3d2d88b75734567382a6d76edc3ef5105afa9150b81e87305503a5f8f","cross_cats_sorted":["cs.AI","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-03-03T11:59:03Z","title_canon_sha256":"c87b3b7402a0b036065ca13d8145b89f1d9a32e7381b9b3d878dafc51b0db253"},"schema_version":"1.0","source":{"id":"2503.01450","kind":"arxiv","version":7}},"canonical_sha256":"3a0b9750385f19408306629cc74d64223289e769a1ea46ae7f160929fc9c367c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3a0b9750385f19408306629cc74d64223289e769a1ea46ae7f160929fc9c367c","first_computed_at":"2026-05-28T01:04:27.001325Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-28T01:04:27.001325Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"lfnOhfdYcoJe+F5/jdG4egJynoAMVaPApQjgJlNRqC1MDOp5hIXnZNBbzYgx4ur3vDndh3JYGENkp7KaW7rQAQ==","signature_status":"signed_v1","signed_at":"2026-05-28T01:04:27.001862Z","signed_message":"canonical_sha256_bytes"},"source_id":"2503.01450","source_kind":"arxiv","source_version":7}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8a390320ca49bba45d9859b0537989d824ed124547237225811c74894f88a1a2","sha256:56575f0d2df67f22de5bb1d985f88d1be56e068e956d0598af310aedfb8482b0"],"state_sha256":"7774c51c287a4f9587c875824d188ad3e7c524730ed1158fbb933380ad72f024"}