{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:WJWSWF5MMJZTN72HMBLGBNSKRA","short_pith_number":"pith:WJWSWF5M","canonical_record":{"source":{"id":"1802.09127","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-26T02:04:57Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"9405e7320da7ad5d43df69ab24a31abcccd22e147a0c6f5ab14667d903340e19","abstract_canon_sha256":"c35508a5a28fc31e5344039b853bcaceb7a5884e2cc8d377ee595125c3d65e3a"},"schema_version":"1.0"},"canonical_sha256":"b26d2b17ac627336ff47605660b64a880ff6f4a95dbed2f1289bf1f932ce908c","source":{"kind":"arxiv","id":"1802.09127","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.09127","created_at":"2026-05-18T00:22:34Z"},{"alias_kind":"arxiv_version","alias_value":"1802.09127v1","created_at":"2026-05-18T00:22:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.09127","created_at":"2026-05-18T00:22:34Z"},{"alias_kind":"pith_short_12","alias_value":"WJWSWF5MMJZT","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_16","alias_value":"WJWSWF5MMJZTN72H","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_8","alias_value":"WJWSWF5M","created_at":"2026-05-18T12:32:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:WJWSWF5MMJZTN72HMBLGBNSKRA","target":"record","payload":{"canonical_record":{"source":{"id":"1802.09127","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-26T02:04:57Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"9405e7320da7ad5d43df69ab24a31abcccd22e147a0c6f5ab14667d903340e19","abstract_canon_sha256":"c35508a5a28fc31e5344039b853bcaceb7a5884e2cc8d377ee595125c3d65e3a"},"schema_version":"1.0"},"canonical_sha256":"b26d2b17ac627336ff47605660b64a880ff6f4a95dbed2f1289bf1f932ce908c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:22:34.694652Z","signature_b64":"Epu/dHa4cAtz9RnJtvoko3GWj3t74GcWYJVurOQoCQxqezQ3vt5AnMNqkli2N135ALxlpq1y1LH/NXgV99TfDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b26d2b17ac627336ff47605660b64a880ff6f4a95dbed2f1289bf1f932ce908c","last_reissued_at":"2026-05-18T00:22:34.693991Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:22:34.693991Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1802.09127","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Tbw/R/u7x8ahVzGtoyxHq8k5p0iXJSQlE4voMRzSLkf8wQ1/g3kP0n/tOkmOuCuf8aRm1BOxPRYOh1p0hkm+Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T13:17:35.873565Z"},"content_sha256":"09622f2a8caf1260a0018231c10de0d8e0417e34fc1264243a6c4cf086582faf","schema_version":"1.0","event_id":"sha256:09622f2a8caf1260a0018231c10de0d8e0417e34fc1264243a6c4cf086582faf"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:WJWSWF5MMJZTN72HMBLGBNSKRA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Deep Bayesian Bandits Showdown: An Empirical Comparison of Bayesian Deep Networks for Thompson Sampling","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"stat.ML","authors_text":"Carlos Riquelme, George Tucker, Jasper Snoek","submitted_at":"2018-02-26T02:04:57Z","abstract_excerpt":"Recent advances in deep reinforcement learning have made significant strides in performance on applications such as Go and Atari games. However, developing practical methods to balance exploration and exploitation in complex domains remains largely unsolved. Thompson Sampling and its extension to reinforcement learning provide an elegant approach to exploration that only requires access to posterior samples of the model. At the same time, advances in approximate Bayesian methods have made posterior approximation for flexible neural network models practical. Thus, it is attractive to consider a"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.09127","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"rCkkMrKnaafashm3wh3wNPMM+v69NgDstVrH7ivAdAFwvRrcK+EGvMvRyziEfF/zYE4lLCoipTGmHEgkfL2QBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T13:17:35.874245Z"},"content_sha256":"80e33f25f1d9e70e02b6a89723e883634e6910ade719da9a55de50ea2d01825b","schema_version":"1.0","event_id":"sha256:80e33f25f1d9e70e02b6a89723e883634e6910ade719da9a55de50ea2d01825b"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WJWSWF5MMJZTN72HMBLGBNSKRA/bundle.json","state_url":"https://pith.science/pith/WJWSWF5MMJZTN72HMBLGBNSKRA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WJWSWF5MMJZTN72HMBLGBNSKRA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T13:17:35Z","links":{"resolver":"https://pith.science/pith/WJWSWF5MMJZTN72HMBLGBNSKRA","bundle":"https://pith.science/pith/WJWSWF5MMJZTN72HMBLGBNSKRA/bundle.json","state":"https://pith.science/pith/WJWSWF5MMJZTN72HMBLGBNSKRA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WJWSWF5MMJZTN72HMBLGBNSKRA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:WJWSWF5MMJZTN72HMBLGBNSKRA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c35508a5a28fc31e5344039b853bcaceb7a5884e2cc8d377ee595125c3d65e3a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-26T02:04:57Z","title_canon_sha256":"9405e7320da7ad5d43df69ab24a31abcccd22e147a0c6f5ab14667d903340e19"},"schema_version":"1.0","source":{"id":"1802.09127","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.09127","created_at":"2026-05-18T00:22:34Z"},{"alias_kind":"arxiv_version","alias_value":"1802.09127v1","created_at":"2026-05-18T00:22:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.09127","created_at":"2026-05-18T00:22:34Z"},{"alias_kind":"pith_short_12","alias_value":"WJWSWF5MMJZT","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_16","alias_value":"WJWSWF5MMJZTN72H","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_8","alias_value":"WJWSWF5M","created_at":"2026-05-18T12:32:59Z"}],"graph_snapshots":[{"event_id":"sha256:80e33f25f1d9e70e02b6a89723e883634e6910ade719da9a55de50ea2d01825b","target":"graph","created_at":"2026-05-18T00:22:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Recent advances in deep reinforcement learning have made significant strides in performance on applications such as Go and Atari games. However, developing practical methods to balance exploration and exploitation in complex domains remains largely unsolved. Thompson Sampling and its extension to reinforcement learning provide an elegant approach to exploration that only requires access to posterior samples of the model. At the same time, advances in approximate Bayesian methods have made posterior approximation for flexible neural network models practical. Thus, it is attractive to consider a","authors_text":"Carlos Riquelme, George Tucker, Jasper Snoek","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-26T02:04:57Z","title":"Deep Bayesian Bandits Showdown: An Empirical Comparison of Bayesian Deep Networks for Thompson Sampling"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.09127","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:09622f2a8caf1260a0018231c10de0d8e0417e34fc1264243a6c4cf086582faf","target":"record","created_at":"2026-05-18T00:22:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c35508a5a28fc31e5344039b853bcaceb7a5884e2cc8d377ee595125c3d65e3a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-02-26T02:04:57Z","title_canon_sha256":"9405e7320da7ad5d43df69ab24a31abcccd22e147a0c6f5ab14667d903340e19"},"schema_version":"1.0","source":{"id":"1802.09127","kind":"arxiv","version":1}},"canonical_sha256":"b26d2b17ac627336ff47605660b64a880ff6f4a95dbed2f1289bf1f932ce908c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b26d2b17ac627336ff47605660b64a880ff6f4a95dbed2f1289bf1f932ce908c","first_computed_at":"2026-05-18T00:22:34.693991Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:22:34.693991Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Epu/dHa4cAtz9RnJtvoko3GWj3t74GcWYJVurOQoCQxqezQ3vt5AnMNqkli2N135ALxlpq1y1LH/NXgV99TfDA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:22:34.694652Z","signed_message":"canonical_sha256_bytes"},"source_id":"1802.09127","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:09622f2a8caf1260a0018231c10de0d8e0417e34fc1264243a6c4cf086582faf","sha256:80e33f25f1d9e70e02b6a89723e883634e6910ade719da9a55de50ea2d01825b"],"state_sha256":"fa2c5f13a13b5fc9eb79cb0ce3ea3696303d5650e5cd2a5d8490336ab96e54c6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"LNwj64XBjEu0sDBVxMJyqYIUNu80YtR2DjdtN09+yHz1cacd1hu4yqWlqsMiy/6IzPcH01JtKHqc9EogdJvODQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T13:17:35.878027Z","bundle_sha256":"cbfbcbae4e75f3edc430a0d4d8d0f422156d241783b47a659cb19a57d80b004b"}}