{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:V65F2QVLQ2MXCWCLW2GH6DUF6E","short_pith_number":"pith:V65F2QVL","schema_version":"1.0","canonical_sha256":"afba5d42ab869971584bb68c7f0e85f119606477a05ed8c03f5f997db01d7d7b","source":{"kind":"arxiv","id":"1802.09810","version":1},"attestation_state":"computed","paper":{"title":"Human-in-the-Loop Synthesis for Partially Observable Markov Decision Processes","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Jie Fu, Nils Jansen, Ralf Wimmer, Steven Carr, Ufuk Topcu","submitted_at":"2018-02-27T10:29:56Z","abstract_excerpt":"We study planning problems where autonomous agents operate inside environments that are subject to uncertainties and not fully observable. Partially observable Markov decision processes (POMDPs) are a natural formal model to capture such problems. Because of the potentially huge or even infinite belief space in POMDPs, synthesis with safety guarantees is, in general, computationally intractable. We propose an approach that aims to circumvent this difficulty: in scenarios that can be partially or fully simulated in a virtual environment, we actively integrate a human user to control an agent. W"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1802.09810","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-02-27T10:29:56Z","cross_cats_sorted":[],"title_canon_sha256":"0cf9237e8e5c7f76e0f4cb0eaee71d892cf4f1adab6708cf9aff3bef61fd83f6","abstract_canon_sha256":"c5119509053e3aef5bc2ceed00b4923181757497a5f68c24e0ae6720c60e9149"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:22:22.124345Z","signature_b64":"YQg1KnAK9I98NKTa7yLA7bis2M//NsSJF1kAFptXKBCUCsrnW72aGC0td5Tlmwz5MSSibx+x97WXKxmw2XUdAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"afba5d42ab869971584bb68c7f0e85f119606477a05ed8c03f5f997db01d7d7b","last_reissued_at":"2026-05-18T00:22:22.123567Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:22:22.123567Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Human-in-the-Loop Synthesis for Partially Observable Markov Decision Processes","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Jie Fu, Nils Jansen, Ralf Wimmer, Steven Carr, Ufuk Topcu","submitted_at":"2018-02-27T10:29:56Z","abstract_excerpt":"We study planning problems where autonomous agents operate inside environments that are subject to uncertainties and not fully observable. Partially observable Markov decision processes (POMDPs) are a natural formal model to capture such problems. Because of the potentially huge or even infinite belief space in POMDPs, synthesis with safety guarantees is, in general, computationally intractable. We propose an approach that aims to circumvent this difficulty: in scenarios that can be partially or fully simulated in a virtual environment, we actively integrate a human user to control an agent. W"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.09810","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1802.09810","created_at":"2026-05-18T00:22:22.123710+00:00"},{"alias_kind":"arxiv_version","alias_value":"1802.09810v1","created_at":"2026-05-18T00:22:22.123710+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.09810","created_at":"2026-05-18T00:22:22.123710+00:00"},{"alias_kind":"pith_short_12","alias_value":"V65F2QVLQ2MX","created_at":"2026-05-18T12:32:59.047623+00:00"},{"alias_kind":"pith_short_16","alias_value":"V65F2QVLQ2MXCWCL","created_at":"2026-05-18T12:32:59.047623+00:00"},{"alias_kind":"pith_short_8","alias_value":"V65F2QVL","created_at":"2026-05-18T12:32:59.047623+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E","json":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E.json","graph_json":"https://pith.science/api/pith-number/V65F2QVLQ2MXCWCLW2GH6DUF6E/graph.json","events_json":"https://pith.science/api/pith-number/V65F2QVLQ2MXCWCLW2GH6DUF6E/events.json","paper":"https://pith.science/paper/V65F2QVL"},"agent_actions":{"view_html":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E","download_json":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E.json","view_paper":"https://pith.science/paper/V65F2QVL","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1802.09810&json=true","fetch_graph":"https://pith.science/api/pith-number/V65F2QVLQ2MXCWCLW2GH6DUF6E/graph.json","fetch_events":"https://pith.science/api/pith-number/V65F2QVLQ2MXCWCLW2GH6DUF6E/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E/action/timestamp_anchor","attest_storage":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E/action/storage_attestation","attest_author":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E/action/author_attestation","sign_citation":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E/action/citation_signature","submit_replication":"https://pith.science/pith/V65F2QVLQ2MXCWCLW2GH6DUF6E/action/replication_record"}},"created_at":"2026-05-18T00:22:22.123710+00:00","updated_at":"2026-05-18T00:22:22.123710+00:00"}