{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:KRFR433CLRD4W6EIXPFYDZL2KA","short_pith_number":"pith:KRFR433C","canonical_record":{"source":{"id":"1802.06037","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-16T17:23:02Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"a3df9110a1b1acdfaf6d61aff8d0da25ddf346de2a268d65240e6940666ff499","abstract_canon_sha256":"4fed89509c176296259b45f3b7f8213219fd4d8486acb88ebae8f9456a73348c"},"schema_version":"1.0"},"canonical_sha256":"544b1e6f625c47cb7888bbcb81e57a501a681a996ee710188c14f6c5dda350c3","source":{"kind":"arxiv","id":"1802.06037","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.06037","created_at":"2026-05-18T00:23:10Z"},{"alias_kind":"arxiv_version","alias_value":"1802.06037v1","created_at":"2026-05-18T00:23:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.06037","created_at":"2026-05-18T00:23:10Z"},{"alias_kind":"pith_short_12","alias_value":"KRFR433CLRD4","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"KRFR433CLRD4W6EI","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"KRFR433C","created_at":"2026-05-18T12:32:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:KRFR433CLRD4W6EIXPFYDZL2KA","target":"record","payload":{"canonical_record":{"source":{"id":"1802.06037","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-16T17:23:02Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"a3df9110a1b1acdfaf6d61aff8d0da25ddf346de2a268d65240e6940666ff499","abstract_canon_sha256":"4fed89509c176296259b45f3b7f8213219fd4d8486acb88ebae8f9456a73348c"},"schema_version":"1.0"},"canonical_sha256":"544b1e6f625c47cb7888bbcb81e57a501a681a996ee710188c14f6c5dda350c3","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:23:10.078641Z","signature_b64":"99H57zCrq2mmxQEuSsNWWqqsVdSaJFg4U38HYmM0aQ3LE0QjLFccfLlM+BiDGsRip+jWx6ur+EXfqXkWfFG4Bg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"544b1e6f625c47cb7888bbcb81e57a501a681a996ee710188c14f6c5dda350c3","last_reissued_at":"2026-05-18T00:23:10.077972Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:23:10.077972Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1802.06037","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:23:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SZpXQF+GWQEOE3JMzv7IJQ7jPg/JTXvuj8fyALmgUgpIukhHvjCXvD+MtDzJtE8mdaHwLMcPW+Oqq/tyY9SXCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T01:23:27.641496Z"},"content_sha256":"5ca58d6c43ceaa93d31c06500b6ef2429c3288170f82e80f528e28f210ff703f","schema_version":"1.0","event_id":"sha256:5ca58d6c43ceaa93d31c06500b6ef2429c3288170f82e80f528e28f210ff703f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:KRFR433CLRD4W6EIXPFYDZL2KA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Policy Evaluation and Optimization with Continuous Treatments","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"stat.ML","authors_text":"Angela Zhou, Nathan Kallus","submitted_at":"2018-02-16T17:23:02Z","abstract_excerpt":"We study the problem of policy evaluation and learning from batched contextual bandit data when treatments are continuous, going beyond previous work on discrete treatments. Previous work for discrete treatment/action spaces focuses on inverse probability weighting (IPW) and doubly robust (DR) methods that use a rejection sampling approach for evaluation and the equivalent weighted classification problem for learning. In the continuous setting, this reduction fails as we would almost surely reject all observations. To tackle the case of continuous treatments, we extend the IPW and DR approache"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.06037","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:23:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"gT10SeyTTXdXh1Li7RZey7FGtkuTLmKWIPrMv9kuDaO1u2G55Kit/EyeMQyQsjAg9jYXlQysVzot5NyNj3XqDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T01:23:27.641832Z"},"content_sha256":"1edcf6e89220abfd96e3c947d12688aab121b2c10d51d4d504fe7a15d74c6be5","schema_version":"1.0","event_id":"sha256:1edcf6e89220abfd96e3c947d12688aab121b2c10d51d4d504fe7a15d74c6be5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/KRFR433CLRD4W6EIXPFYDZL2KA/bundle.json","state_url":"https://pith.science/pith/KRFR433CLRD4W6EIXPFYDZL2KA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/KRFR433CLRD4W6EIXPFYDZL2KA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T01:23:27Z","links":{"resolver":"https://pith.science/pith/KRFR433CLRD4W6EIXPFYDZL2KA","bundle":"https://pith.science/pith/KRFR433CLRD4W6EIXPFYDZL2KA/bundle.json","state":"https://pith.science/pith/KRFR433CLRD4W6EIXPFYDZL2KA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/KRFR433CLRD4W6EIXPFYDZL2KA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:KRFR433CLRD4W6EIXPFYDZL2KA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4fed89509c176296259b45f3b7f8213219fd4d8486acb88ebae8f9456a73348c","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-16T17:23:02Z","title_canon_sha256":"a3df9110a1b1acdfaf6d61aff8d0da25ddf346de2a268d65240e6940666ff499"},"schema_version":"1.0","source":{"id":"1802.06037","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.06037","created_at":"2026-05-18T00:23:10Z"},{"alias_kind":"arxiv_version","alias_value":"1802.06037v1","created_at":"2026-05-18T00:23:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.06037","created_at":"2026-05-18T00:23:10Z"},{"alias_kind":"pith_short_12","alias_value":"KRFR433CLRD4","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"KRFR433CLRD4W6EI","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"KRFR433C","created_at":"2026-05-18T12:32:33Z"}],"graph_snapshots":[{"event_id":"sha256:1edcf6e89220abfd96e3c947d12688aab121b2c10d51d4d504fe7a15d74c6be5","target":"graph","created_at":"2026-05-18T00:23:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We study the problem of policy evaluation and learning from batched contextual bandit data when treatments are continuous, going beyond previous work on discrete treatments. Previous work for discrete treatment/action spaces focuses on inverse probability weighting (IPW) and doubly robust (DR) methods that use a rejection sampling approach for evaluation and the equivalent weighted classification problem for learning. In the continuous setting, this reduction fails as we would almost surely reject all observations. To tackle the case of continuous treatments, we extend the IPW and DR approache","authors_text":"Angela Zhou, Nathan Kallus","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-16T17:23:02Z","title":"Policy Evaluation and Optimization with Continuous Treatments"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.06037","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5ca58d6c43ceaa93d31c06500b6ef2429c3288170f82e80f528e28f210ff703f","target":"record","created_at":"2026-05-18T00:23:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4fed89509c176296259b45f3b7f8213219fd4d8486acb88ebae8f9456a73348c","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-16T17:23:02Z","title_canon_sha256":"a3df9110a1b1acdfaf6d61aff8d0da25ddf346de2a268d65240e6940666ff499"},"schema_version":"1.0","source":{"id":"1802.06037","kind":"arxiv","version":1}},"canonical_sha256":"544b1e6f625c47cb7888bbcb81e57a501a681a996ee710188c14f6c5dda350c3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"544b1e6f625c47cb7888bbcb81e57a501a681a996ee710188c14f6c5dda350c3","first_computed_at":"2026-05-18T00:23:10.077972Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:23:10.077972Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"99H57zCrq2mmxQEuSsNWWqqsVdSaJFg4U38HYmM0aQ3LE0QjLFccfLlM+BiDGsRip+jWx6ur+EXfqXkWfFG4Bg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:23:10.078641Z","signed_message":"canonical_sha256_bytes"},"source_id":"1802.06037","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5ca58d6c43ceaa93d31c06500b6ef2429c3288170f82e80f528e28f210ff703f","sha256:1edcf6e89220abfd96e3c947d12688aab121b2c10d51d4d504fe7a15d74c6be5"],"state_sha256":"91fe813cf745769ef5b41aef36346bdc4f401bb555b1af02541377baa29b2ece"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QsHz2X37ttY9ZMHbj8OCU8KnoQn2BNdz1YxqGqQVBb8DUrNgvXs5fuE9BPAJNbA3F0cCaatXgKUZRpgOYydgDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T01:23:27.643641Z","bundle_sha256":"a2d8cdda88f6c39824a4575fba00a64c0c312975397d507b5711e6cc8d6f9787"}}