{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2021:6PWEW4WS6RP5GGQR374P43C6MM","short_pith_number":"pith:6PWEW4WS","canonical_record":{"source":{"id":"2105.13431","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2021-05-27T20:12:20Z","cross_cats_sorted":["cs.AI","cs.SY","eess.SY"],"title_canon_sha256":"0b212843e6d10ead4b61fa793bcd41f3d9730ee5ff45d7ba3e17e50d13d30137","abstract_canon_sha256":"7bef6fdb8dccb8703a3b554b700f91db2a52358192c6b8cd630a21d5536909b5"},"schema_version":"1.0"},"canonical_sha256":"f3ec4b72d2f45fd31a11dff8fe6c5e633f94e9da780700f5a1ad9225f2b659ad","source":{"kind":"arxiv","id":"2105.13431","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2105.13431","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"arxiv_version","alias_value":"2105.13431v2","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2105.13431","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"pith_short_12","alias_value":"6PWEW4WS6RP5","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"pith_short_16","alias_value":"6PWEW4WS6RP5GGQR","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"pith_short_8","alias_value":"6PWEW4WS","created_at":"2026-05-26T01:03:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2021:6PWEW4WS6RP5GGQR374P43C6MM","target":"record","payload":{"canonical_record":{"source":{"id":"2105.13431","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2021-05-27T20:12:20Z","cross_cats_sorted":["cs.AI","cs.SY","eess.SY"],"title_canon_sha256":"0b212843e6d10ead4b61fa793bcd41f3d9730ee5ff45d7ba3e17e50d13d30137","abstract_canon_sha256":"7bef6fdb8dccb8703a3b554b700f91db2a52358192c6b8cd630a21d5536909b5"},"schema_version":"1.0"},"canonical_sha256":"f3ec4b72d2f45fd31a11dff8fe6c5e633f94e9da780700f5a1ad9225f2b659ad","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-26T01:03:07.145126Z","signature_b64":"UF51qtTyBqnxEtgmEr4I6Ro80oAMZrAdteGll1Ctpp62ra2Km//UxkBhTOLaneZh6eYnTDrsCPXv77/jEfbBCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f3ec4b72d2f45fd31a11dff8fe6c5e633f94e9da780700f5a1ad9225f2b659ad","last_reissued_at":"2026-05-26T01:03:07.144370Z","signature_status":"signed_v1","first_computed_at":"2026-05-26T01:03:07.144370Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2105.13431","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T01:03:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kybfnyCX7l+TajDwGk5nu0zLnCRFpDYBlXf8Y926fYC0QXluHUPKN6gOWcIHgd7jpbrTq6z3ix8yOoROTpBOBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T00:27:14.789573Z"},"content_sha256":"fd8c6050adac396d61b907de23d1b50b7717359076dab1a1ec7a04053861e98c","schema_version":"1.0","event_id":"sha256:fd8c6050adac396d61b907de23d1b50b7717359076dab1a1ec7a04053861e98c"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2021:6PWEW4WS6RP5GGQR374P43C6MM","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"An Offline Risk-aware Policy Selection Method for Bayesian Markov Decision Processes","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.AI","cs.SY","eess.SY"],"primary_cat":"cs.LG","authors_text":"Caroline Ponzoni Carvalho Chanel, Giorgio Angelotti, Nicolas Drougard","submitted_at":"2021-05-27T20:12:20Z","abstract_excerpt":"In Offline Model Learning for Planning and in Offline Reinforcement Learning, the limited data set hinders the estimate of the Value function of the relative Markov Decision Process (MDP). Consequently, the performance of the obtained policy in the real world is bounded and possibly risky, especially when the deployment of a wrong policy can lead to catastrophic consequences. For this reason, several pathways are being followed with the scope of reducing the model error (or the distributional shift between the learned model and the true one) and, more broadly, obtaining risk-aware solutions wi"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2105.13431","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2105.13431/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T01:03:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"NVYKxgYRvEoEhshz4koN6aJeyMc+qXqtdzZTdltMo7kG7gvCVgDzCsKMN/UuMhtamiD/jf1bnCSVVukYoVM/AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T00:27:14.789958Z"},"content_sha256":"612812be2e558f3087c6ea3bee38ed5639f800e4b24b8890f6d32a61234f7668","schema_version":"1.0","event_id":"sha256:612812be2e558f3087c6ea3bee38ed5639f800e4b24b8890f6d32a61234f7668"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6PWEW4WS6RP5GGQR374P43C6MM/bundle.json","state_url":"https://pith.science/pith/6PWEW4WS6RP5GGQR374P43C6MM/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6PWEW4WS6RP5GGQR374P43C6MM/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-01T00:27:14Z","links":{"resolver":"https://pith.science/pith/6PWEW4WS6RP5GGQR374P43C6MM","bundle":"https://pith.science/pith/6PWEW4WS6RP5GGQR374P43C6MM/bundle.json","state":"https://pith.science/pith/6PWEW4WS6RP5GGQR374P43C6MM/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6PWEW4WS6RP5GGQR374P43C6MM/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2021:6PWEW4WS6RP5GGQR374P43C6MM","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7bef6fdb8dccb8703a3b554b700f91db2a52358192c6b8cd630a21d5536909b5","cross_cats_sorted":["cs.AI","cs.SY","eess.SY"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2021-05-27T20:12:20Z","title_canon_sha256":"0b212843e6d10ead4b61fa793bcd41f3d9730ee5ff45d7ba3e17e50d13d30137"},"schema_version":"1.0","source":{"id":"2105.13431","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2105.13431","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"arxiv_version","alias_value":"2105.13431v2","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2105.13431","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"pith_short_12","alias_value":"6PWEW4WS6RP5","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"pith_short_16","alias_value":"6PWEW4WS6RP5GGQR","created_at":"2026-05-26T01:03:07Z"},{"alias_kind":"pith_short_8","alias_value":"6PWEW4WS","created_at":"2026-05-26T01:03:07Z"}],"graph_snapshots":[{"event_id":"sha256:612812be2e558f3087c6ea3bee38ed5639f800e4b24b8890f6d32a61234f7668","target":"graph","created_at":"2026-05-26T01:03:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2105.13431/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"In Offline Model Learning for Planning and in Offline Reinforcement Learning, the limited data set hinders the estimate of the Value function of the relative Markov Decision Process (MDP). Consequently, the performance of the obtained policy in the real world is bounded and possibly risky, especially when the deployment of a wrong policy can lead to catastrophic consequences. For this reason, several pathways are being followed with the scope of reducing the model error (or the distributional shift between the learned model and the true one) and, more broadly, obtaining risk-aware solutions wi","authors_text":"Caroline Ponzoni Carvalho Chanel, Giorgio Angelotti, Nicolas Drougard","cross_cats":["cs.AI","cs.SY","eess.SY"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2021-05-27T20:12:20Z","title":"An Offline Risk-aware Policy Selection Method for Bayesian Markov Decision Processes"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2105.13431","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fd8c6050adac396d61b907de23d1b50b7717359076dab1a1ec7a04053861e98c","target":"record","created_at":"2026-05-26T01:03:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7bef6fdb8dccb8703a3b554b700f91db2a52358192c6b8cd630a21d5536909b5","cross_cats_sorted":["cs.AI","cs.SY","eess.SY"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2021-05-27T20:12:20Z","title_canon_sha256":"0b212843e6d10ead4b61fa793bcd41f3d9730ee5ff45d7ba3e17e50d13d30137"},"schema_version":"1.0","source":{"id":"2105.13431","kind":"arxiv","version":2}},"canonical_sha256":"f3ec4b72d2f45fd31a11dff8fe6c5e633f94e9da780700f5a1ad9225f2b659ad","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f3ec4b72d2f45fd31a11dff8fe6c5e633f94e9da780700f5a1ad9225f2b659ad","first_computed_at":"2026-05-26T01:03:07.144370Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-26T01:03:07.144370Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UF51qtTyBqnxEtgmEr4I6Ro80oAMZrAdteGll1Ctpp62ra2Km//UxkBhTOLaneZh6eYnTDrsCPXv77/jEfbBCg==","signature_status":"signed_v1","signed_at":"2026-05-26T01:03:07.145126Z","signed_message":"canonical_sha256_bytes"},"source_id":"2105.13431","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fd8c6050adac396d61b907de23d1b50b7717359076dab1a1ec7a04053861e98c","sha256:612812be2e558f3087c6ea3bee38ed5639f800e4b24b8890f6d32a61234f7668"],"state_sha256":"b00813ef1a61e4db843a96786d0588431eebf36b25545e3a9ce82e9057d8f54e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oqfj0hRE5SBC7W8oLbBeuICbGM36rimzfLtOaslZ+466E9yA/9ivzsYjEbyh6bM5GJ6qk/C4M9UZMDGAU7ZxAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-01T00:27:14.792362Z","bundle_sha256":"aa29dcb42a823b9aa6c8c9becf6cd672853489d09ffda897e3aa7bd3f53813b5"}}