{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:DH2VEJ27KUY7Z3FJXIFC73XLWS","short_pith_number":"pith:DH2VEJ27","schema_version":"1.0","canonical_sha256":"19f552275f5531fceca9ba0a2feeebb4ab901d52699c1d1cb60ba985e199c40c","source":{"kind":"arxiv","id":"1602.03348","version":2},"attestation_state":"computed","paper":{"title":"Iterative Hierarchical Optimization for Misspecified Problems (IHOMP)","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Daniel J. Mankowitz, Shie Mannor, Timothy A. Mann","submitted_at":"2016-02-10T12:27:04Z","abstract_excerpt":"For complex, high-dimensional Markov Decision Processes (MDPs), it may be necessary to represent the policy with function approximation. A problem is misspecified whenever, the representation cannot express any policy with acceptable performance. We introduce IHOMP : an approach for solving misspecified problems. IHOMP iteratively learns a set of context specialized options and combines these options to solve an otherwise misspecified problem. Our main contribution is proving that IHOMP enjoys theoretical convergence guarantees. In addition, we extend IHOMP to exploit Option Interruption (OI) "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1602.03348","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-02-10T12:27:04Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"5666cd613bd6fd55e9644847b68a03ac6a6948dc492856719bc36707e75b7f4a","abstract_canon_sha256":"1e51d8912edfd317748bea9b558fa024a84049b6eb16ba39e55f659ca1c7fa64"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:12:43.225276Z","signature_b64":"mtDJNNfVbEpLMbJ6xUMkUnQ7QdmiZWmwcqUe7oPPimtHmHsyu5Otrhn8F6Qx4Pp+EWAR45ae5ohKCbuOGe33DA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"19f552275f5531fceca9ba0a2feeebb4ab901d52699c1d1cb60ba985e199c40c","last_reissued_at":"2026-05-18T01:12:43.224943Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:12:43.224943Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Iterative Hierarchical Optimization for Misspecified Problems (IHOMP)","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Daniel J. Mankowitz, Shie Mannor, Timothy A. Mann","submitted_at":"2016-02-10T12:27:04Z","abstract_excerpt":"For complex, high-dimensional Markov Decision Processes (MDPs), it may be necessary to represent the policy with function approximation. A problem is misspecified whenever, the representation cannot express any policy with acceptable performance. We introduce IHOMP : an approach for solving misspecified problems. IHOMP iteratively learns a set of context specialized options and combines these options to solve an otherwise misspecified problem. Our main contribution is proving that IHOMP enjoys theoretical convergence guarantees. In addition, we extend IHOMP to exploit Option Interruption (OI) "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1602.03348","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1602.03348","created_at":"2026-05-18T01:12:43.224997+00:00"},{"alias_kind":"arxiv_version","alias_value":"1602.03348v2","created_at":"2026-05-18T01:12:43.224997+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1602.03348","created_at":"2026-05-18T01:12:43.224997+00:00"},{"alias_kind":"pith_short_12","alias_value":"DH2VEJ27KUY7","created_at":"2026-05-18T12:30:12.583610+00:00"},{"alias_kind":"pith_short_16","alias_value":"DH2VEJ27KUY7Z3FJ","created_at":"2026-05-18T12:30:12.583610+00:00"},{"alias_kind":"pith_short_8","alias_value":"DH2VEJ27","created_at":"2026-05-18T12:30:12.583610+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS","json":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS.json","graph_json":"https://pith.science/api/pith-number/DH2VEJ27KUY7Z3FJXIFC73XLWS/graph.json","events_json":"https://pith.science/api/pith-number/DH2VEJ27KUY7Z3FJXIFC73XLWS/events.json","paper":"https://pith.science/paper/DH2VEJ27"},"agent_actions":{"view_html":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS","download_json":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS.json","view_paper":"https://pith.science/paper/DH2VEJ27","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1602.03348&json=true","fetch_graph":"https://pith.science/api/pith-number/DH2VEJ27KUY7Z3FJXIFC73XLWS/graph.json","fetch_events":"https://pith.science/api/pith-number/DH2VEJ27KUY7Z3FJXIFC73XLWS/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS/action/timestamp_anchor","attest_storage":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS/action/storage_attestation","attest_author":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS/action/author_attestation","sign_citation":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS/action/citation_signature","submit_replication":"https://pith.science/pith/DH2VEJ27KUY7Z3FJXIFC73XLWS/action/replication_record"}},"created_at":"2026-05-18T01:12:43.224997+00:00","updated_at":"2026-05-18T01:12:43.224997+00:00"}