{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2017:HFSIVXEIGL6VEI2CDBBQRPAVFS","short_pith_number":"pith:HFSIVXEI","schema_version":"1.0","canonical_sha256":"39648adc8832fd522342184308bc152ca27459ac1f0cce378d38d2f088e7ce1e","source":{"kind":"arxiv","id":"1705.07384","version":2},"attestation_state":"computed","paper":{"title":"Balanced Policy Evaluation and Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","math.OC"],"primary_cat":"stat.ML","authors_text":"Nathan Kallus","submitted_at":"2017-05-21T03:03:27Z","abstract_excerpt":"We present a new approach to the problems of evaluating and learning personalized decision policies from observational data of past contexts, decisions, and outcomes. Only the outcome of the enacted decision is available and the historical policy is unknown. These problems arise in personalized medicine using electronic health records and in internet advertising. Existing approaches use inverse propensity weighting (or, doubly robust versions) to make historical outcome (or, residual) data look like it were generated by a new policy being evaluated or learned. But this relies on a plug-in appr"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1705.07384","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-05-21T03:03:27Z","cross_cats_sorted":["cs.LG","math.OC"],"title_canon_sha256":"879c704efe09515969728f99674096f72e84928cf987e6e868fedec48898ffdc","abstract_canon_sha256":"fa1c2e2026f3e3e7364463ab336698779440cd6b14a82c9932046957b0a6bf01"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:44:33.043850Z","signature_b64":"zgGnYfAvFQJsjVvNiXT6AWge16QgR+nkEg81hl3OB5FsTAx6MY2N/xQp5lROWyiuCAXT9eRqYIcu68oE+bATBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"39648adc8832fd522342184308bc152ca27459ac1f0cce378d38d2f088e7ce1e","last_reissued_at":"2026-05-17T23:44:33.043212Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:44:33.043212Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Balanced Policy Evaluation and Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","math.OC"],"primary_cat":"stat.ML","authors_text":"Nathan Kallus","submitted_at":"2017-05-21T03:03:27Z","abstract_excerpt":"We present a new approach to the problems of evaluating and learning personalized decision policies from observational data of past contexts, decisions, and outcomes. Only the outcome of the enacted decision is available and the historical policy is unknown. These problems arise in personalized medicine using electronic health records and in internet advertising. Existing approaches use inverse propensity weighting (or, doubly robust versions) to make historical outcome (or, residual) data look like it were generated by a new policy being evaluated or learned. But this relies on a plug-in appr"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.07384","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1705.07384","created_at":"2026-05-17T23:44:33.043305+00:00"},{"alias_kind":"arxiv_version","alias_value":"1705.07384v2","created_at":"2026-05-17T23:44:33.043305+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.07384","created_at":"2026-05-17T23:44:33.043305+00:00"},{"alias_kind":"pith_short_12","alias_value":"HFSIVXEIGL6V","created_at":"2026-05-18T12:31:18.294218+00:00"},{"alias_kind":"pith_short_16","alias_value":"HFSIVXEIGL6VEI2C","created_at":"2026-05-18T12:31:18.294218+00:00"},{"alias_kind":"pith_short_8","alias_value":"HFSIVXEI","created_at":"2026-05-18T12:31:18.294218+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS","json":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS.json","graph_json":"https://pith.science/api/pith-number/HFSIVXEIGL6VEI2CDBBQRPAVFS/graph.json","events_json":"https://pith.science/api/pith-number/HFSIVXEIGL6VEI2CDBBQRPAVFS/events.json","paper":"https://pith.science/paper/HFSIVXEI"},"agent_actions":{"view_html":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS","download_json":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS.json","view_paper":"https://pith.science/paper/HFSIVXEI","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1705.07384&json=true","fetch_graph":"https://pith.science/api/pith-number/HFSIVXEIGL6VEI2CDBBQRPAVFS/graph.json","fetch_events":"https://pith.science/api/pith-number/HFSIVXEIGL6VEI2CDBBQRPAVFS/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS/action/timestamp_anchor","attest_storage":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS/action/storage_attestation","attest_author":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS/action/author_attestation","sign_citation":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS/action/citation_signature","submit_replication":"https://pith.science/pith/HFSIVXEIGL6VEI2CDBBQRPAVFS/action/replication_record"}},"created_at":"2026-05-17T23:44:33.043305+00:00","updated_at":"2026-05-17T23:44:33.043305+00:00"}