{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:ZFQN5GPFYSBCZDQ2GU2ELIP65F","short_pith_number":"pith:ZFQN5GPF","canonical_record":{"source":{"id":"1905.12044","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-28T19:33:49Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"00af7d07fa030c05928d02a9eec2ff99de28b45a9ea76ba6710385ca6dabd152","abstract_canon_sha256":"85d58eecb6b3c72dcb29458f3c876ac4b069c000473d8d671275865a21d4e6cb"},"schema_version":"1.0"},"canonical_sha256":"c960de99e5c4822c8e1a353445a1fee975cc60a46280a8c040860a4f467e34b5","source":{"kind":"arxiv","id":"1905.12044","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.12044","created_at":"2026-05-17T23:44:49Z"},{"alias_kind":"arxiv_version","alias_value":"1905.12044v1","created_at":"2026-05-17T23:44:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.12044","created_at":"2026-05-17T23:44:49Z"},{"alias_kind":"pith_short_12","alias_value":"ZFQN5GPFYSBC","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_16","alias_value":"ZFQN5GPFYSBCZDQ2","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_8","alias_value":"ZFQN5GPF","created_at":"2026-05-18T12:33:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:ZFQN5GPFYSBCZDQ2GU2ELIP65F","target":"record","payload":{"canonical_record":{"source":{"id":"1905.12044","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-28T19:33:49Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"00af7d07fa030c05928d02a9eec2ff99de28b45a9ea76ba6710385ca6dabd152","abstract_canon_sha256":"85d58eecb6b3c72dcb29458f3c876ac4b069c000473d8d671275865a21d4e6cb"},"schema_version":"1.0"},"canonical_sha256":"c960de99e5c4822c8e1a353445a1fee975cc60a46280a8c040860a4f467e34b5","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:44:49.118374Z","signature_b64":"59CZN4bMJHV7dMUnePm1pNCTPU6D1O6t9CPhP8g1RER44ZttF+9PhQpkRhAEQ6m80Etj+m5iv/PXPqjaGMWtCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c960de99e5c4822c8e1a353445a1fee975cc60a46280a8c040860a4f467e34b5","last_reissued_at":"2026-05-17T23:44:49.117763Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:44:49.117763Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1905.12044","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0nVuxDA3WOt1UBD6EXgcDruQAAab3zxF0ejJX4HcSs/CsO9GQ/5cD4H4AtCnO5lo8X/KsARHaXp/n89XHqaeAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T21:29:53.252689Z"},"content_sha256":"0401cf64e90d0d8e26aba64030f39721bee3832ac5a11fc0e601fc6ced95369e","schema_version":"1.0","event_id":"sha256:0401cf64e90d0d8e26aba64030f39721bee3832ac5a11fc0e601fc6ced95369e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:ZFQN5GPFYSBCZDQ2GU2ELIP65F","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Generation of Policy-Level Explanations for Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","stat.ML"],"primary_cat":"cs.LG","authors_text":"Manuela Veloso, Nicholay Topin","submitted_at":"2019-05-28T19:33:49Z","abstract_excerpt":"Though reinforcement learning has greatly benefited from the incorporation of neural networks, the inability to verify the correctness of such systems limits their use. Current work in explainable deep learning focuses on explaining only a single decision in terms of input features, making it unsuitable for explaining a sequence of decisions. To address this need, we introduce Abstracted Policy Graphs, which are Markov chains of abstract states. This representation concisely summarizes a policy so that individual decisions can be explained in the context of expected future transitions. Additio"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.12044","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WqzRZS/YfurDpnrTemOG1/L3xAw/IzVNFDqq0fniluSeDT6GHuvx8x6CcuY1Vd8ki+Ps+FzDewoBnYVWBLEJAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T21:29:53.253037Z"},"content_sha256":"4d062c070b10c9ea830fa5c9cac6981a28837d6ef4b0663261ef35d842e1ae54","schema_version":"1.0","event_id":"sha256:4d062c070b10c9ea830fa5c9cac6981a28837d6ef4b0663261ef35d842e1ae54"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZFQN5GPFYSBCZDQ2GU2ELIP65F/bundle.json","state_url":"https://pith.science/pith/ZFQN5GPFYSBCZDQ2GU2ELIP65F/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZFQN5GPFYSBCZDQ2GU2ELIP65F/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T21:29:53Z","links":{"resolver":"https://pith.science/pith/ZFQN5GPFYSBCZDQ2GU2ELIP65F","bundle":"https://pith.science/pith/ZFQN5GPFYSBCZDQ2GU2ELIP65F/bundle.json","state":"https://pith.science/pith/ZFQN5GPFYSBCZDQ2GU2ELIP65F/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZFQN5GPFYSBCZDQ2GU2ELIP65F/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:ZFQN5GPFYSBCZDQ2GU2ELIP65F","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"85d58eecb6b3c72dcb29458f3c876ac4b069c000473d8d671275865a21d4e6cb","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-28T19:33:49Z","title_canon_sha256":"00af7d07fa030c05928d02a9eec2ff99de28b45a9ea76ba6710385ca6dabd152"},"schema_version":"1.0","source":{"id":"1905.12044","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.12044","created_at":"2026-05-17T23:44:49Z"},{"alias_kind":"arxiv_version","alias_value":"1905.12044v1","created_at":"2026-05-17T23:44:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.12044","created_at":"2026-05-17T23:44:49Z"},{"alias_kind":"pith_short_12","alias_value":"ZFQN5GPFYSBC","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_16","alias_value":"ZFQN5GPFYSBCZDQ2","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_8","alias_value":"ZFQN5GPF","created_at":"2026-05-18T12:33:33Z"}],"graph_snapshots":[{"event_id":"sha256:4d062c070b10c9ea830fa5c9cac6981a28837d6ef4b0663261ef35d842e1ae54","target":"graph","created_at":"2026-05-17T23:44:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Though reinforcement learning has greatly benefited from the incorporation of neural networks, the inability to verify the correctness of such systems limits their use. Current work in explainable deep learning focuses on explaining only a single decision in terms of input features, making it unsuitable for explaining a sequence of decisions. To address this need, we introduce Abstracted Policy Graphs, which are Markov chains of abstract states. This representation concisely summarizes a policy so that individual decisions can be explained in the context of expected future transitions. Additio","authors_text":"Manuela Veloso, Nicholay Topin","cross_cats":["cs.AI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-28T19:33:49Z","title":"Generation of Policy-Level Explanations for Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.12044","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0401cf64e90d0d8e26aba64030f39721bee3832ac5a11fc0e601fc6ced95369e","target":"record","created_at":"2026-05-17T23:44:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"85d58eecb6b3c72dcb29458f3c876ac4b069c000473d8d671275865a21d4e6cb","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-05-28T19:33:49Z","title_canon_sha256":"00af7d07fa030c05928d02a9eec2ff99de28b45a9ea76ba6710385ca6dabd152"},"schema_version":"1.0","source":{"id":"1905.12044","kind":"arxiv","version":1}},"canonical_sha256":"c960de99e5c4822c8e1a353445a1fee975cc60a46280a8c040860a4f467e34b5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c960de99e5c4822c8e1a353445a1fee975cc60a46280a8c040860a4f467e34b5","first_computed_at":"2026-05-17T23:44:49.117763Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:44:49.117763Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"59CZN4bMJHV7dMUnePm1pNCTPU6D1O6t9CPhP8g1RER44ZttF+9PhQpkRhAEQ6m80Etj+m5iv/PXPqjaGMWtCQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:44:49.118374Z","signed_message":"canonical_sha256_bytes"},"source_id":"1905.12044","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0401cf64e90d0d8e26aba64030f39721bee3832ac5a11fc0e601fc6ced95369e","sha256:4d062c070b10c9ea830fa5c9cac6981a28837d6ef4b0663261ef35d842e1ae54"],"state_sha256":"2f058a2ba6a1646c9df4fd2b902d73bbc5cf11c9621f6351a5ffdc874ca76361"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"HkDot0+BpBK7gRG1btniXsqs1HcsjnEEQuMC5G2TylbWyaPATPNcFuJGigSGumkQNWj7iMdWodBq1ev20mIACg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T21:29:53.255421Z","bundle_sha256":"8d182796b681422b0cda3ce8486b7cc8c2673f1e778ac9719140b47497888f3f"}}