{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:5LOGV7CSGD7YVGSMBVORD5OB55","short_pith_number":"pith:5LOGV7CS","canonical_record":{"source":{"id":"2605.20272","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-19T02:26:28Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"2150d9d65fe74f47c4bedaadc17cdecb601c5830ae64ffdd6c902e429ea2a620","abstract_canon_sha256":"510e5e119354def8dc92a1222acb1cc1d72b47cc5e2cfc2b460138b1678bc8d5"},"schema_version":"1.0"},"canonical_sha256":"eadc6afc5230ff8a9a4c0d5d11f5c1ef494bcf1b78ced4f568380d5a81b704f2","source":{"kind":"arxiv","id":"2605.20272","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.20272","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"arxiv_version","alias_value":"2605.20272v1","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.20272","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"pith_short_12","alias_value":"5LOGV7CSGD7Y","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"pith_short_16","alias_value":"5LOGV7CSGD7YVGSM","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"pith_short_8","alias_value":"5LOGV7CS","created_at":"2026-05-21T00:04:23Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:5LOGV7CSGD7YVGSMBVORD5OB55","target":"record","payload":{"canonical_record":{"source":{"id":"2605.20272","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-19T02:26:28Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"2150d9d65fe74f47c4bedaadc17cdecb601c5830ae64ffdd6c902e429ea2a620","abstract_canon_sha256":"510e5e119354def8dc92a1222acb1cc1d72b47cc5e2cfc2b460138b1678bc8d5"},"schema_version":"1.0"},"canonical_sha256":"eadc6afc5230ff8a9a4c0d5d11f5c1ef494bcf1b78ced4f568380d5a81b704f2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-21T00:04:23.516745Z","signature_b64":"dshlw5uAmYXhELTRflwHyQqfpbP2+s1EjmBnwkxVN2gnOn7OXOqjS/wLnx3qnJEgah9zVQslS4f/87mASBaUCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"eadc6afc5230ff8a9a4c0d5d11f5c1ef494bcf1b78ced4f568380d5a81b704f2","last_reissued_at":"2026-05-21T00:04:23.516280Z","signature_status":"signed_v1","first_computed_at":"2026-05-21T00:04:23.516280Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.20272","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T00:04:23Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1V/qswePPjmus07FshZqOkKXKtVu2+h/t7pcCujPIFFL5FEdvrzj58yvBm++5B5dO/0qune0K9I7x4RhsysbDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T11:44:20.467698Z"},"content_sha256":"e2822313be688775c4159dbf628b4a5da0761dd5c60145bbdc4b990cfa8bfecc","schema_version":"1.0","event_id":"sha256:e2822313be688775c4159dbf628b4a5da0761dd5c60145bbdc4b990cfa8bfecc"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:5LOGV7CSGD7YVGSMBVORD5OB55","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Smaller Abstract State Spaces Enable Cross-Scale Generalization in Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Lucas Lehnert, Nasehatul Mustakim","submitted_at":"2026-05-19T02:26:28Z","abstract_excerpt":"While humans readily generalize abstract concepts to more complex or larger tasks, building Reinforcement Learning (RL) systems with this ability remains elusive. Here, we present the first theoretical model of how such Out-of-Distribution (OOD) generalization can be achieved in RL agents. Our approach considers Partially Observable Markov Decision Processes (POMDPs) and assumes that an intelligent agent uses an abstraction function to determine which experiences can be treated as equivalent and which must be distinguished. First, we extend the existing state abstraction framework and proof te"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.20272","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.20272/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T00:04:23Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Cf/ajJ+/mxYMcazsaGaoKrkm74zcw2F7r/V7PBY722HY+fSD29ZDm3xEKQ4KuXLA5JC0d7AIGInvxbtBWrNaBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T11:44:20.468087Z"},"content_sha256":"9c3e5538e3c3036cbe3ace1bf4b297823612f4ce2ddcae4580ed17dfb4f2548c","schema_version":"1.0","event_id":"sha256:9c3e5538e3c3036cbe3ace1bf4b297823612f4ce2ddcae4580ed17dfb4f2548c"},{"event_type":"integrity_finding","subject_pith_number":"pith:2026:5LOGV7CSGD7YVGSMBVORD5OB55","target":"integrity","payload":{"note":"DOI in the printed bibliography is fragmented by whitespace or line breaks. A longer candidate (10.5555/2621980.David) was visible in the surrounding text but could not be confirmed against doi.org as printed.","snippet":"ISBN 978-1-107-05713-5. URLhttps: //dl.acm.org/doi/book/10.5555/2621980. David Silver, Aja Huang, Chris J. Maddison, Arthur Guez, Laurent Sifre, George van den Driessche, Julian Schrittwieser, Ioannis Antonoglou, Veda Panneershelvam, Marc L","arxiv_id":"2605.20272","detector":"doi_compliance","evidence":{"ref_index":12,"verdict_class":"incontrovertible","resolved_title":null,"printed_excerpt":"ISBN 978-1-107-05713-5. URLhttps: //dl.acm.org/doi/book/10.5555/2621980. David Silver, Aja Huang, Chris J. Maddison, Arthur Guez, Laurent Sifre, George van den Driessche, Julian Schrittwieser, Ioannis Antonoglou, Veda Panneershelvam, Marc L","reconstructed_doi":"10.5555/2621980.David"},"severity":"advisory","ref_index":12,"audited_at":"2026-05-21T07:35:09.015615Z","event_type":"pith.integrity.v1","detected_doi":"10.5555/2621980.David","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"recoverable_identifier","evidence_hash":"f64d97c18c543af1c9cef143271213323c1272e340fce7ccccd39f70a69f026d","paper_version":1,"verdict_class":"incontrovertible","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null,"integrity_event_id":5871,"payload_sha256":"aae1e264b1f76cb4c039b3653c6f193056c6dd54c3164fd841ddbdf65f6929ea","signature_b64":"g9TRPrNLQvWRw6wuBqgojsMGKStVAhUr8c1JpSOyCvVu5mrEcaZMOO3CISSjA/rliri2sW/hfIFNCzjwDIx7Ag==","signing_key_id":"pith-v1-2026-05"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T07:39:11Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"J+EqxVZPI8+5ZeKTJVhUXd6Z9V1ka3IabpfYCRvqBbGNT/A6EhmIEt5DNzsYcYkAneXx1vmijiRrSBcjhQyKDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T11:44:20.469039Z"},"content_sha256":"b628279784168a202f7c27106ed0c9eccdd81353dce8de3d49ea71b96f766f71","schema_version":"1.0","event_id":"sha256:b628279784168a202f7c27106ed0c9eccdd81353dce8de3d49ea71b96f766f71"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5LOGV7CSGD7YVGSMBVORD5OB55/bundle.json","state_url":"https://pith.science/pith/5LOGV7CSGD7YVGSMBVORD5OB55/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5LOGV7CSGD7YVGSMBVORD5OB55/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T11:44:20Z","links":{"resolver":"https://pith.science/pith/5LOGV7CSGD7YVGSMBVORD5OB55","bundle":"https://pith.science/pith/5LOGV7CSGD7YVGSMBVORD5OB55/bundle.json","state":"https://pith.science/pith/5LOGV7CSGD7YVGSMBVORD5OB55/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5LOGV7CSGD7YVGSMBVORD5OB55/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5LOGV7CSGD7YVGSMBVORD5OB55","merge_version":"pith-open-graph-merge-v1","event_count":3,"valid_event_count":3,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"510e5e119354def8dc92a1222acb1cc1d72b47cc5e2cfc2b460138b1678bc8d5","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-19T02:26:28Z","title_canon_sha256":"2150d9d65fe74f47c4bedaadc17cdecb601c5830ae64ffdd6c902e429ea2a620"},"schema_version":"1.0","source":{"id":"2605.20272","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.20272","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"arxiv_version","alias_value":"2605.20272v1","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.20272","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"pith_short_12","alias_value":"5LOGV7CSGD7Y","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"pith_short_16","alias_value":"5LOGV7CSGD7YVGSM","created_at":"2026-05-21T00:04:23Z"},{"alias_kind":"pith_short_8","alias_value":"5LOGV7CS","created_at":"2026-05-21T00:04:23Z"}],"graph_snapshots":[{"event_id":"sha256:9c3e5538e3c3036cbe3ace1bf4b297823612f4ce2ddcae4580ed17dfb4f2548c","target":"graph","created_at":"2026-05-21T00:04:23Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.20272/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"While humans readily generalize abstract concepts to more complex or larger tasks, building Reinforcement Learning (RL) systems with this ability remains elusive. Here, we present the first theoretical model of how such Out-of-Distribution (OOD) generalization can be achieved in RL agents. Our approach considers Partially Observable Markov Decision Processes (POMDPs) and assumes that an intelligent agent uses an abstraction function to determine which experiences can be treated as equivalent and which must be distinguished. First, we extend the existing state abstraction framework and proof te","authors_text":"Lucas Lehnert, Nasehatul Mustakim","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-19T02:26:28Z","title":"Smaller Abstract State Spaces Enable Cross-Scale Generalization in Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.20272","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e2822313be688775c4159dbf628b4a5da0761dd5c60145bbdc4b990cfa8bfecc","target":"record","created_at":"2026-05-21T00:04:23Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"510e5e119354def8dc92a1222acb1cc1d72b47cc5e2cfc2b460138b1678bc8d5","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-19T02:26:28Z","title_canon_sha256":"2150d9d65fe74f47c4bedaadc17cdecb601c5830ae64ffdd6c902e429ea2a620"},"schema_version":"1.0","source":{"id":"2605.20272","kind":"arxiv","version":1}},"canonical_sha256":"eadc6afc5230ff8a9a4c0d5d11f5c1ef494bcf1b78ced4f568380d5a81b704f2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"eadc6afc5230ff8a9a4c0d5d11f5c1ef494bcf1b78ced4f568380d5a81b704f2","first_computed_at":"2026-05-21T00:04:23.516280Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-21T00:04:23.516280Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"dshlw5uAmYXhELTRflwHyQqfpbP2+s1EjmBnwkxVN2gnOn7OXOqjS/wLnx3qnJEgah9zVQslS4f/87mASBaUCg==","signature_status":"signed_v1","signed_at":"2026-05-21T00:04:23.516745Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.20272","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e2822313be688775c4159dbf628b4a5da0761dd5c60145bbdc4b990cfa8bfecc","sha256:9c3e5538e3c3036cbe3ace1bf4b297823612f4ce2ddcae4580ed17dfb4f2548c","sha256:b628279784168a202f7c27106ed0c9eccdd81353dce8de3d49ea71b96f766f71"],"state_sha256":"564afd6bb5605c495ac8f64c54f95258bcac05a11ca8cbff21eaf70b41a40e31"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"XCFiU3PrQFASSFKNG+RBdtyF5o2hhxqx9qUDjBAMeUAmZPMmCRpfJ6HinDMFnGTHfKUWGO04OsPT61WBzfiaAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T11:44:20.472033Z","bundle_sha256":"c413347d57631012e38b5814aa59efd3b189b335e06396c5a85254bdfcfa2454"}}