{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:SHIZBXBABN4DWNCKR7P4FYUS2L","short_pith_number":"pith:SHIZBXBA","canonical_record":{"source":{"id":"2605.18509","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T15:01:30Z","cross_cats_sorted":[],"title_canon_sha256":"add019ad29b5506112ae0a5e4001a1b0f95e021d2f58dce2cb24dab54e306890","abstract_canon_sha256":"8627c2a2da6af4075ae678939ed2dc79491c62a584e4e0bd8d6593a3111ecafb"},"schema_version":"1.0"},"canonical_sha256":"91d190dc200b783b344a8fdfc2e292d2d3c25e9c6b68ba4ad7220822952bde2a","source":{"kind":"arxiv","id":"2605.18509","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18509","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18509v1","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18509","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_12","alias_value":"SHIZBXBABN4D","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_16","alias_value":"SHIZBXBABN4DWNCK","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_8","alias_value":"SHIZBXBA","created_at":"2026-05-20T00:06:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:SHIZBXBABN4DWNCKR7P4FYUS2L","target":"record","payload":{"canonical_record":{"source":{"id":"2605.18509","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T15:01:30Z","cross_cats_sorted":[],"title_canon_sha256":"add019ad29b5506112ae0a5e4001a1b0f95e021d2f58dce2cb24dab54e306890","abstract_canon_sha256":"8627c2a2da6af4075ae678939ed2dc79491c62a584e4e0bd8d6593a3111ecafb"},"schema_version":"1.0"},"canonical_sha256":"91d190dc200b783b344a8fdfc2e292d2d3c25e9c6b68ba4ad7220822952bde2a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:06:04.938268Z","signature_b64":"enEZqrC34/UMS9BX/eJ6Y6aeur0l5C1kRpcRL3o+RxCNMxjcBerupjy9LNBHcTar3dxFqZ0cAKQTrkyh4LvlDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"91d190dc200b783b344a8fdfc2e292d2d3c25e9c6b68ba4ad7220822952bde2a","last_reissued_at":"2026-05-20T00:06:04.937360Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:06:04.937360Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.18509","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MPYNaN930lTk21QiVVN8OLwX9pzHBJAWC6sLrUkL1maMQR8MdZSndAktGd+4qc9nD41cw97wPOzvOyHiXBYoBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T10:32:36.873097Z"},"content_sha256":"69b824553a1900968d547cb2f4774f9678fda1d0bbd3067b067ec9c5f3268de4","schema_version":"1.0","event_id":"sha256:69b824553a1900968d547cb2f4774f9678fda1d0bbd3067b067ec9c5f3268de4"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:SHIZBXBABN4DWNCKR7P4FYUS2L","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Offline Contextual Bandits in the Presence of New Actions","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Kazuki Kawamura, Kei Tateno, Ren Kishimoto, Takanori Muroi, Takuma Udagawa, Tatsuhiro Shimizu, Yuki Sasamoto, Yusuke Narita, Yuta Saito","submitted_at":"2026-05-18T15:01:30Z","abstract_excerpt":"Automated decision-making algorithms drive applications such as recommendation systems and search engines. These algorithms often rely on off-policy contextual bandits or off-policy learning (OPL). Conventionally, OPL selects actions that maximize the expected reward from an existing action set. However, in many real-world scenarios, actions, such as news articles or video content, change continuously, and the action space evolves over time after data collection. We define actions introduced after deploying the logging policy as new actions and focus on OPL with new actions. Existing OPL metho"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18509","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18509/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"s6jnNKbbUWJd16ePIN1Lua8/FBRT1LT7a4JW6+/NGjMz59wultW3dqitmQVRWP1TUZX8ihmgWT6dgqWR/ihBBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T10:32:36.873996Z"},"content_sha256":"6109d6600b881cb5b6737d2dc984bf9579c4792c8829cab82de6da087945bad5","schema_version":"1.0","event_id":"sha256:6109d6600b881cb5b6737d2dc984bf9579c4792c8829cab82de6da087945bad5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SHIZBXBABN4DWNCKR7P4FYUS2L/bundle.json","state_url":"https://pith.science/pith/SHIZBXBABN4DWNCKR7P4FYUS2L/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SHIZBXBABN4DWNCKR7P4FYUS2L/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-23T10:32:36Z","links":{"resolver":"https://pith.science/pith/SHIZBXBABN4DWNCKR7P4FYUS2L","bundle":"https://pith.science/pith/SHIZBXBABN4DWNCKR7P4FYUS2L/bundle.json","state":"https://pith.science/pith/SHIZBXBABN4DWNCKR7P4FYUS2L/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SHIZBXBABN4DWNCKR7P4FYUS2L/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:SHIZBXBABN4DWNCKR7P4FYUS2L","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8627c2a2da6af4075ae678939ed2dc79491c62a584e4e0bd8d6593a3111ecafb","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T15:01:30Z","title_canon_sha256":"add019ad29b5506112ae0a5e4001a1b0f95e021d2f58dce2cb24dab54e306890"},"schema_version":"1.0","source":{"id":"2605.18509","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18509","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18509v1","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18509","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_12","alias_value":"SHIZBXBABN4D","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_16","alias_value":"SHIZBXBABN4DWNCK","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_8","alias_value":"SHIZBXBA","created_at":"2026-05-20T00:06:04Z"}],"graph_snapshots":[{"event_id":"sha256:6109d6600b881cb5b6737d2dc984bf9579c4792c8829cab82de6da087945bad5","target":"graph","created_at":"2026-05-20T00:06:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.18509/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Automated decision-making algorithms drive applications such as recommendation systems and search engines. These algorithms often rely on off-policy contextual bandits or off-policy learning (OPL). Conventionally, OPL selects actions that maximize the expected reward from an existing action set. However, in many real-world scenarios, actions, such as news articles or video content, change continuously, and the action space evolves over time after data collection. We define actions introduced after deploying the logging policy as new actions and focus on OPL with new actions. Existing OPL metho","authors_text":"Kazuki Kawamura, Kei Tateno, Ren Kishimoto, Takanori Muroi, Takuma Udagawa, Tatsuhiro Shimizu, Yuki Sasamoto, Yusuke Narita, Yuta Saito","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T15:01:30Z","title":"Offline Contextual Bandits in the Presence of New Actions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18509","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:69b824553a1900968d547cb2f4774f9678fda1d0bbd3067b067ec9c5f3268de4","target":"record","created_at":"2026-05-20T00:06:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8627c2a2da6af4075ae678939ed2dc79491c62a584e4e0bd8d6593a3111ecafb","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T15:01:30Z","title_canon_sha256":"add019ad29b5506112ae0a5e4001a1b0f95e021d2f58dce2cb24dab54e306890"},"schema_version":"1.0","source":{"id":"2605.18509","kind":"arxiv","version":1}},"canonical_sha256":"91d190dc200b783b344a8fdfc2e292d2d3c25e9c6b68ba4ad7220822952bde2a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"91d190dc200b783b344a8fdfc2e292d2d3c25e9c6b68ba4ad7220822952bde2a","first_computed_at":"2026-05-20T00:06:04.937360Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:06:04.937360Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"enEZqrC34/UMS9BX/eJ6Y6aeur0l5C1kRpcRL3o+RxCNMxjcBerupjy9LNBHcTar3dxFqZ0cAKQTrkyh4LvlDA==","signature_status":"signed_v1","signed_at":"2026-05-20T00:06:04.938268Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.18509","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:69b824553a1900968d547cb2f4774f9678fda1d0bbd3067b067ec9c5f3268de4","sha256:6109d6600b881cb5b6737d2dc984bf9579c4792c8829cab82de6da087945bad5"],"state_sha256":"2dabe273aaa067b069f51b2ddefa1ceed2054982a7a396b64af33c0c2141b54c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kom+Fo1tE6rVN6uVxCaLmR6rB4ltJVKcmwlHfzcI2dxkGsvfFTzs/q/nFasRhopG3JOiKEKhu6EyXf31zNMkAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-23T10:32:36.877824Z","bundle_sha256":"9d32cf568ab9643da2f6fbbf4e67936044ff639d0174f57ec534ec370032311f"}}