{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:27LCWZEXOZORSBBGAADPJNQXTQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6b089e8f68e5aedc84636a5fe21c71ecf8d843db102ae4d6169f14f822b12bd3","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2014-05-14T08:03:08Z","title_canon_sha256":"944fec365831b1e3da3c176e5eb68a0f65ee20349c2c86d32f9442563ec4d51a"},"schema_version":"1.0","source":{"id":"1405.3396","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1405.3396","created_at":"2026-05-18T02:51:56Z"},{"alias_kind":"arxiv_version","alias_value":"1405.3396v1","created_at":"2026-05-18T02:51:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1405.3396","created_at":"2026-05-18T02:51:56Z"},{"alias_kind":"pith_short_12","alias_value":"27LCWZEXOZOR","created_at":"2026-05-18T12:28:09Z"},{"alias_kind":"pith_short_16","alias_value":"27LCWZEXOZORSBBG","created_at":"2026-05-18T12:28:09Z"},{"alias_kind":"pith_short_8","alias_value":"27LCWZEX","created_at":"2026-05-18T12:28:09Z"}],"graph_snapshots":[{"event_id":"sha256:5bffadf278eff8bd462419dd9d883f500de57f6d7c482cbf03d21f8bc7b6a151","target":"graph","created_at":"2026-05-18T02:51:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We present algorithms for reducing the Dueling Bandits problem to the conventional (stochastic) Multi-Armed Bandits problem. The Dueling Bandits problem is an online model of learning with ordinal feedback of the form \"A is preferred to B\" (as opposed to cardinal feedback like \"A has value 2.5\"), giving it wide applicability in learning from implicit user feedback and revealed and stated preferences. In contrast to existing algorithms for the Dueling Bandits problem, our reductions -- named $\\Doubler$, $\\MultiSbm$ and $\\DoubleSbm$ -- provide a generic schema for translating the extensive body ","authors_text":"Nir Ailon, Thorsten Joachims, Zohar Karnin","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2014-05-14T08:03:08Z","title":"Reducing Dueling Bandits to Cardinal Bandits"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1405.3396","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8b91a3cd478e43ea2af18459f1720532721e3f5763952e726212c1e65af2944d","target":"record","created_at":"2026-05-18T02:51:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6b089e8f68e5aedc84636a5fe21c71ecf8d843db102ae4d6169f14f822b12bd3","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2014-05-14T08:03:08Z","title_canon_sha256":"944fec365831b1e3da3c176e5eb68a0f65ee20349c2c86d32f9442563ec4d51a"},"schema_version":"1.0","source":{"id":"1405.3396","kind":"arxiv","version":1}},"canonical_sha256":"d7d62b6497765d1904260006f4b6179c07633f54ca2e296192dc319c5e1dda58","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d7d62b6497765d1904260006f4b6179c07633f54ca2e296192dc319c5e1dda58","first_computed_at":"2026-05-18T02:51:56.134058Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:51:56.134058Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"8km/6si3swfuYglwkWIMEQMWnSgWNNcu/p1Vgkoox9G8HC8ZIrsz4tLPf64kvXhJbgFDNC5c7cGiFSyttabqBw==","signature_status":"signed_v1","signed_at":"2026-05-18T02:51:56.134567Z","signed_message":"canonical_sha256_bytes"},"source_id":"1405.3396","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8b91a3cd478e43ea2af18459f1720532721e3f5763952e726212c1e65af2944d","sha256:5bffadf278eff8bd462419dd9d883f500de57f6d7c482cbf03d21f8bc7b6a151"],"state_sha256":"09a5128033e5e575f8261ee01050cc0a414559ca9ea1feac84f7b8cad46dc563"}