{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:RN6ZNQFL56QWLSOKHOIUZQQR4T","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d1886fa35a67444672264add5be2542b9688c389abe470d016d5f9d2cdbb0fe2","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ML","submitted_at":"2025-10-14T05:14:54Z","title_canon_sha256":"6fea8b6ab0f62e50c41d3ad66b9259e151e488e20e1d8142768ef771cfd5e29d"},"schema_version":"1.0","source":{"id":"2510.12152","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2510.12152","created_at":"2026-05-29T01:04:56Z"},{"alias_kind":"arxiv_version","alias_value":"2510.12152v2","created_at":"2026-05-29T01:04:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.12152","created_at":"2026-05-29T01:04:56Z"},{"alias_kind":"pith_short_12","alias_value":"RN6ZNQFL56QW","created_at":"2026-05-29T01:04:56Z"},{"alias_kind":"pith_short_16","alias_value":"RN6ZNQFL56QWLSOK","created_at":"2026-05-29T01:04:56Z"},{"alias_kind":"pith_short_8","alias_value":"RN6ZNQFL","created_at":"2026-05-29T01:04:56Z"}],"graph_snapshots":[{"event_id":"sha256:147008611d57fe86b0d54a9392c90d0be955adf6b6147df878b380a458225149","target":"graph","created_at":"2026-05-29T01:04:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2510.12152/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"We study the decoupled multi-armed bandit problem, where the learner separately selects one arm for exploration and one, possibly different, arm for exploitation at each round. In this setting, the loss of the explored arm is observed but not incurred, whereas the loss of the exploited arm is incurred without being observed. We propose an efficient Follow-the-Perturbed-Leader (FTPL) policy that achieves Best-of-Both-Worlds (BOBW) guarantee with constant regret in the stochastic regime and optimal $O(\\sqrt{KT})$ regret in the adversarial regime. A key feature of our method is that it completely","authors_text":"Chaiwon Kim, Jongyeong Lee, Min-hwan Oh","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ML","submitted_at":"2025-10-14T05:14:54Z","title":"Follow-the-Perturbed-Leader for Decoupled Bandits: Best-of-Both-Worlds and Practicality"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.12152","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6eefd5bf0ada7f4a183bc5c12b7f1997ae40217bcc358e74e28160b4e0b6a5e1","target":"record","created_at":"2026-05-29T01:04:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d1886fa35a67444672264add5be2542b9688c389abe470d016d5f9d2cdbb0fe2","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"stat.ML","submitted_at":"2025-10-14T05:14:54Z","title_canon_sha256":"6fea8b6ab0f62e50c41d3ad66b9259e151e488e20e1d8142768ef771cfd5e29d"},"schema_version":"1.0","source":{"id":"2510.12152","kind":"arxiv","version":2}},"canonical_sha256":"8b7d96c0abefa165c9ca3b914cc211e4c00721d3c41bffc20813c051309fecb8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8b7d96c0abefa165c9ca3b914cc211e4c00721d3c41bffc20813c051309fecb8","first_computed_at":"2026-05-29T01:04:56.811743Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T01:04:56.811743Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"XsdJiT6NFlU7EhHDu30ynJjDKfw6lqD/MJ/3Nn7y25zgxYa1i6iPKOI81azA29qjXxMCSH50mdYE9yUcVkWbBA==","signature_status":"signed_v1","signed_at":"2026-05-29T01:04:56.812353Z","signed_message":"canonical_sha256_bytes"},"source_id":"2510.12152","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6eefd5bf0ada7f4a183bc5c12b7f1997ae40217bcc358e74e28160b4e0b6a5e1","sha256:147008611d57fe86b0d54a9392c90d0be955adf6b6147df878b380a458225149"],"state_sha256":"e1d908c2bb4bdd43d7b80d31a3a34f425fb64f21bb8e5b7c47f38479b53ab193"}