{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:P5RSZW5H3ESI2HVBTVDZSPP6AB","short_pith_number":"pith:P5RSZW5H","canonical_record":{"source":{"id":"1806.05819","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-15T06:17:55Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"ee6158ace3d3d4c05eb1c78e48350fa7e50b7b7d9bee36d9e44beace5347fd36","abstract_canon_sha256":"e5dfb2e1e4f7bc6ce12921d21536d93f00adc67f80a9ce78de93a8397c9b23ac"},"schema_version":"1.0"},"canonical_sha256":"7f632cdba7d9248d1ea19d47993dfe004998af7ffb56c5d93eb19070fdff1b61","source":{"kind":"arxiv","id":"1806.05819","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1806.05819","created_at":"2026-05-17T23:41:53Z"},{"alias_kind":"arxiv_version","alias_value":"1806.05819v2","created_at":"2026-05-17T23:41:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.05819","created_at":"2026-05-17T23:41:53Z"},{"alias_kind":"pith_short_12","alias_value":"P5RSZW5H3ESI","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_16","alias_value":"P5RSZW5H3ESI2HVB","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_8","alias_value":"P5RSZW5H","created_at":"2026-05-18T12:32:43Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:P5RSZW5H3ESI2HVBTVDZSPP6AB","target":"record","payload":{"canonical_record":{"source":{"id":"1806.05819","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-15T06:17:55Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"ee6158ace3d3d4c05eb1c78e48350fa7e50b7b7d9bee36d9e44beace5347fd36","abstract_canon_sha256":"e5dfb2e1e4f7bc6ce12921d21536d93f00adc67f80a9ce78de93a8397c9b23ac"},"schema_version":"1.0"},"canonical_sha256":"7f632cdba7d9248d1ea19d47993dfe004998af7ffb56c5d93eb19070fdff1b61","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:53.988144Z","signature_b64":"g/NTyjrLXSA+NqEE0u+okxdDbINaesgzMc4HFr+6Kyucb/4XJC9/uyqZAKoaLBN2hQUDRxf0o3C+KeEoZP1ZBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7f632cdba7d9248d1ea19d47993dfe004998af7ffb56c5d93eb19070fdff1b61","last_reissued_at":"2026-05-17T23:41:53.987682Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:53.987682Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1806.05819","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vuH4b9RJGkGuE+pNiyA0ohHVfMpUeFFU+yn36Qyh0+iW567vESEGI6L0xCymoVR9iEDeVmvjw13MuYlf9RHLAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T13:02:02.228597Z"},"content_sha256":"7bab0980e70383f3c6323c48c8ba6be5236d9923e523ace46ba43e8547aa4240","schema_version":"1.0","event_id":"sha256:7bab0980e70383f3c6323c48c8ba6be5236d9923e523ace46ba43e8547aa4240"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:P5RSZW5H3ESI2HVBTVDZSPP6AB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"BubbleRank: Safe Online Learning to Re-Rank via Implicit Click Feedback","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Branislav Kveton, Chang Li, Csaba Szepesvari, Ilya Markov, Maarten de Rijke, Masrour Zoghi, Tor Lattimore","submitted_at":"2018-06-15T06:17:55Z","abstract_excerpt":"In this paper, we study the problem of safe online learning to re-rank, where user feedback is used to improve the quality of displayed lists. Learning to rank has traditionally been studied in two settings. In the offline setting, rankers are typically learned from relevance labels created by judges. This approach has generally become standard in industrial applications of ranking, such as search. However, this approach lacks exploration and thus is limited by the information content of the offline training data. In the online setting, an algorithm can experiment with lists and learn from fee"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.05819","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZklwkrPb1eyqJdiwe91F2q4XGghzAbtZTtOVzbZ+9NGusM5A8rT/XR0wE09nNoEdSUmUTIfgboxPr+7HXqK2Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T13:02:02.228966Z"},"content_sha256":"cdd4b82db155f7a456c6727c0f864cd82df344c8960e1d6a12f60e83f380012d","schema_version":"1.0","event_id":"sha256:cdd4b82db155f7a456c6727c0f864cd82df344c8960e1d6a12f60e83f380012d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/P5RSZW5H3ESI2HVBTVDZSPP6AB/bundle.json","state_url":"https://pith.science/pith/P5RSZW5H3ESI2HVBTVDZSPP6AB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/P5RSZW5H3ESI2HVBTVDZSPP6AB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T13:02:02Z","links":{"resolver":"https://pith.science/pith/P5RSZW5H3ESI2HVBTVDZSPP6AB","bundle":"https://pith.science/pith/P5RSZW5H3ESI2HVBTVDZSPP6AB/bundle.json","state":"https://pith.science/pith/P5RSZW5H3ESI2HVBTVDZSPP6AB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/P5RSZW5H3ESI2HVBTVDZSPP6AB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:P5RSZW5H3ESI2HVBTVDZSPP6AB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e5dfb2e1e4f7bc6ce12921d21536d93f00adc67f80a9ce78de93a8397c9b23ac","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-15T06:17:55Z","title_canon_sha256":"ee6158ace3d3d4c05eb1c78e48350fa7e50b7b7d9bee36d9e44beace5347fd36"},"schema_version":"1.0","source":{"id":"1806.05819","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1806.05819","created_at":"2026-05-17T23:41:53Z"},{"alias_kind":"arxiv_version","alias_value":"1806.05819v2","created_at":"2026-05-17T23:41:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.05819","created_at":"2026-05-17T23:41:53Z"},{"alias_kind":"pith_short_12","alias_value":"P5RSZW5H3ESI","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_16","alias_value":"P5RSZW5H3ESI2HVB","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_8","alias_value":"P5RSZW5H","created_at":"2026-05-18T12:32:43Z"}],"graph_snapshots":[{"event_id":"sha256:cdd4b82db155f7a456c6727c0f864cd82df344c8960e1d6a12f60e83f380012d","target":"graph","created_at":"2026-05-17T23:41:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper, we study the problem of safe online learning to re-rank, where user feedback is used to improve the quality of displayed lists. Learning to rank has traditionally been studied in two settings. In the offline setting, rankers are typically learned from relevance labels created by judges. This approach has generally become standard in industrial applications of ranking, such as search. However, this approach lacks exploration and thus is limited by the information content of the offline training data. In the online setting, an algorithm can experiment with lists and learn from fee","authors_text":"Branislav Kveton, Chang Li, Csaba Szepesvari, Ilya Markov, Maarten de Rijke, Masrour Zoghi, Tor Lattimore","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-15T06:17:55Z","title":"BubbleRank: Safe Online Learning to Re-Rank via Implicit Click Feedback"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.05819","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7bab0980e70383f3c6323c48c8ba6be5236d9923e523ace46ba43e8547aa4240","target":"record","created_at":"2026-05-17T23:41:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e5dfb2e1e4f7bc6ce12921d21536d93f00adc67f80a9ce78de93a8397c9b23ac","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-15T06:17:55Z","title_canon_sha256":"ee6158ace3d3d4c05eb1c78e48350fa7e50b7b7d9bee36d9e44beace5347fd36"},"schema_version":"1.0","source":{"id":"1806.05819","kind":"arxiv","version":2}},"canonical_sha256":"7f632cdba7d9248d1ea19d47993dfe004998af7ffb56c5d93eb19070fdff1b61","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7f632cdba7d9248d1ea19d47993dfe004998af7ffb56c5d93eb19070fdff1b61","first_computed_at":"2026-05-17T23:41:53.987682Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:53.987682Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"g/NTyjrLXSA+NqEE0u+okxdDbINaesgzMc4HFr+6Kyucb/4XJC9/uyqZAKoaLBN2hQUDRxf0o3C+KeEoZP1ZBw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:53.988144Z","signed_message":"canonical_sha256_bytes"},"source_id":"1806.05819","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7bab0980e70383f3c6323c48c8ba6be5236d9923e523ace46ba43e8547aa4240","sha256:cdd4b82db155f7a456c6727c0f864cd82df344c8960e1d6a12f60e83f380012d"],"state_sha256":"203a76f3bce43c880510d224144ca49c8dda06f886ac0353baf66604088ea010"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2yHSpHuYCxgwFZ5cPlfyegEDxdsG/cX38JYUbMsBw6Dq9yb5Ln/TeT39hR3fpXaLqcVbcRx24Tqu+Iwc3OJuAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T13:02:02.230887Z","bundle_sha256":"f9de8bf28c97a12ce69346b7dcbbd7875e935bbfd44c1b89f8566b169c8fd187"}}