{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:GVXEMODDKJQZLZL7LLSSWOTJ4U","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"aee4c7310b3c54a214e3d82be77ebba715ca6d35017dce79b1652afa365c478b","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-09-24T18:13:01Z","title_canon_sha256":"ac94d63a41ccfa0b5ad3fa23d3446dc924aa9419994032c755aaa5c5cc4648c3"},"schema_version":"1.0","source":{"id":"1809.09147","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.09147","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"arxiv_version","alias_value":"1809.09147v1","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.09147","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"pith_short_12","alias_value":"GVXEMODDKJQZ","created_at":"2026-05-18T12:32:25Z"},{"alias_kind":"pith_short_16","alias_value":"GVXEMODDKJQZLZL7","created_at":"2026-05-18T12:32:25Z"},{"alias_kind":"pith_short_8","alias_value":"GVXEMODD","created_at":"2026-05-18T12:32:25Z"}],"graph_snapshots":[{"event_id":"sha256:661c977a9bd29b8fc8decb21685c877f36a1118ec0dd3b851b6560f2faff16d4","target":"graph","created_at":"2026-05-18T00:04:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In the real world, agents often have to operate in situations with incomplete information, limited sensing capabilities, and inherently stochastic environments, making individual observations incomplete and unreliable. Moreover, in many situations it is preferable to delay a decision rather than run the risk of making a bad decision. In such situations it is necessary to aggregate information before taking an action; however, most state of the art reinforcement learning (RL) algorithms are biased towards taking actions \\textit{at every time step}, even if the agent is not particularly confiden","authors_text":"Abhinau Kumar V, Akshat Agarwal, Erik Peterson, Katia Sycara, Kyle Dunovan, Timothy Verstynen","cross_cats":["cs.AI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-09-24T18:13:01Z","title":"Better Safe than Sorry: Evidence Accumulation Allows for Safe Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.09147","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:362c4d7ddae90006a42859efde768d3633ede7ebd6bc875fd54e6db3a49878fa","target":"record","created_at":"2026-05-18T00:04:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"aee4c7310b3c54a214e3d82be77ebba715ca6d35017dce79b1652afa365c478b","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-09-24T18:13:01Z","title_canon_sha256":"ac94d63a41ccfa0b5ad3fa23d3446dc924aa9419994032c755aaa5c5cc4648c3"},"schema_version":"1.0","source":{"id":"1809.09147","kind":"arxiv","version":1}},"canonical_sha256":"356e463863526195e57f5ae52b3a69e50db8b00c98747100c20c5fb528c9133c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"356e463863526195e57f5ae52b3a69e50db8b00c98747100c20c5fb528c9133c","first_computed_at":"2026-05-18T00:04:54.170725Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:04:54.170725Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"nV0JgIyblSSB4a5y+q3+aU83WThFq+bkr4uZ97EVm4CIXh1yaclTUTXSjohivO6c1tG8RUYgCPpO1id8hYpaCw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:04:54.171331Z","signed_message":"canonical_sha256_bytes"},"source_id":"1809.09147","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:362c4d7ddae90006a42859efde768d3633ede7ebd6bc875fd54e6db3a49878fa","sha256:661c977a9bd29b8fc8decb21685c877f36a1118ec0dd3b851b6560f2faff16d4"],"state_sha256":"e2dc3235957589f5c97e380b1513f853ca574e1be9becf68cecc5bd8f9340ccd"}