{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:K3TGK2IYX7TSBNBVFLUYUBQBB7","short_pith_number":"pith:K3TGK2IY","canonical_record":{"source":{"id":"1610.06603","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-20T20:54:41Z","cross_cats_sorted":["cs.DS","stat.ML"],"title_canon_sha256":"699b2a110f16969fe252c875ed66aaedab99ebd90ac1444f5d75380047921a26","abstract_canon_sha256":"6cb602bbb1c998383dd59db298218d641162231151355d5f27fca8612180d37f"},"schema_version":"1.0"},"canonical_sha256":"56e6656918bfe720b4352ae98a06010ff80729b635129bcef850833bc01743b4","source":{"kind":"arxiv","id":"1610.06603","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1610.06603","created_at":"2026-05-18T00:10:19Z"},{"alias_kind":"arxiv_version","alias_value":"1610.06603v4","created_at":"2026-05-18T00:10:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1610.06603","created_at":"2026-05-18T00:10:19Z"},{"alias_kind":"pith_short_12","alias_value":"K3TGK2IYX7TS","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_16","alias_value":"K3TGK2IYX7TSBNBV","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_8","alias_value":"K3TGK2IY","created_at":"2026-05-18T12:30:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:K3TGK2IYX7TSBNBVFLUYUBQBB7","target":"record","payload":{"canonical_record":{"source":{"id":"1610.06603","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-20T20:54:41Z","cross_cats_sorted":["cs.DS","stat.ML"],"title_canon_sha256":"699b2a110f16969fe252c875ed66aaedab99ebd90ac1444f5d75380047921a26","abstract_canon_sha256":"6cb602bbb1c998383dd59db298218d641162231151355d5f27fca8612180d37f"},"schema_version":"1.0"},"canonical_sha256":"56e6656918bfe720b4352ae98a06010ff80729b635129bcef850833bc01743b4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:10:19.575171Z","signature_b64":"el8WvR6bqL4UQZDtRv1IEWxxq/VEpAffa8j5upixkFkn0g5m9SOceWyiMtuMhMcEyhePTq9pIhuCDcLJX2nQBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"56e6656918bfe720b4352ae98a06010ff80729b635129bcef850833bc01743b4","last_reissued_at":"2026-05-18T00:10:19.574512Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:10:19.574512Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1610.06603","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:10:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"D50QCqcsLXw7wVpxG8hfg7+1uAPWTbZ7uOa4L68eaG0mBdodnCTR/3XUM74w4OlbOmqKWsHr7kwtPRTpvsITAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T00:57:39.587870Z"},"content_sha256":"512428a5adacfcfefa99000052945a6bbf88f2a541e6868d276e6cfd0983eb2c","schema_version":"1.0","event_id":"sha256:512428a5adacfcfefa99000052945a6bbf88f2a541e6868d276e6cfd0983eb2c"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:K3TGK2IYX7TSBNBVFLUYUBQBB7","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Combinatorial Multi-Armed Bandit with General Reward Functions","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DS","stat.ML"],"primary_cat":"cs.LG","authors_text":"Fu Li, Jian Li, Pinyan Lu, Wei Chen, Wei Hu, Yu Liu","submitted_at":"2016-10-20T20:54:41Z","abstract_excerpt":"In this paper, we study the stochastic combinatorial multi-armed bandit (CMAB) framework that allows a general nonlinear reward function, whose expected value may not depend only on the means of the input random variables but possibly on the entire distributions of these variables. Our framework enables a much larger class of reward functions such as the $\\max()$ function and nonlinear utility functions. Existing techniques relying on accurate estimations of the means of random variables, such as the upper confidence bound (UCB) technique, do not work directly on these functions. We propose a "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1610.06603","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:10:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8eILS0vqgh5IUXaHWSf4rIK32HhZfzyd9EMQ+fXeZ4fv2tuXdv5Lt3CUmIjOplGmXYCZkvTteoG0MUiRTkMFBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T00:57:39.588952Z"},"content_sha256":"5733441c7888d5e468c20204b9f8a95a1c5cf39f8f4142356ff038e986ec6536","schema_version":"1.0","event_id":"sha256:5733441c7888d5e468c20204b9f8a95a1c5cf39f8f4142356ff038e986ec6536"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/K3TGK2IYX7TSBNBVFLUYUBQBB7/bundle.json","state_url":"https://pith.science/pith/K3TGK2IYX7TSBNBVFLUYUBQBB7/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/K3TGK2IYX7TSBNBVFLUYUBQBB7/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T00:57:39Z","links":{"resolver":"https://pith.science/pith/K3TGK2IYX7TSBNBVFLUYUBQBB7","bundle":"https://pith.science/pith/K3TGK2IYX7TSBNBVFLUYUBQBB7/bundle.json","state":"https://pith.science/pith/K3TGK2IYX7TSBNBVFLUYUBQBB7/state.json","well_known_bundle":"https://pith.science/.well-known/pith/K3TGK2IYX7TSBNBVFLUYUBQBB7/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:K3TGK2IYX7TSBNBVFLUYUBQBB7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6cb602bbb1c998383dd59db298218d641162231151355d5f27fca8612180d37f","cross_cats_sorted":["cs.DS","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-20T20:54:41Z","title_canon_sha256":"699b2a110f16969fe252c875ed66aaedab99ebd90ac1444f5d75380047921a26"},"schema_version":"1.0","source":{"id":"1610.06603","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1610.06603","created_at":"2026-05-18T00:10:19Z"},{"alias_kind":"arxiv_version","alias_value":"1610.06603v4","created_at":"2026-05-18T00:10:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1610.06603","created_at":"2026-05-18T00:10:19Z"},{"alias_kind":"pith_short_12","alias_value":"K3TGK2IYX7TS","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_16","alias_value":"K3TGK2IYX7TSBNBV","created_at":"2026-05-18T12:30:25Z"},{"alias_kind":"pith_short_8","alias_value":"K3TGK2IY","created_at":"2026-05-18T12:30:25Z"}],"graph_snapshots":[{"event_id":"sha256:5733441c7888d5e468c20204b9f8a95a1c5cf39f8f4142356ff038e986ec6536","target":"graph","created_at":"2026-05-18T00:10:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper, we study the stochastic combinatorial multi-armed bandit (CMAB) framework that allows a general nonlinear reward function, whose expected value may not depend only on the means of the input random variables but possibly on the entire distributions of these variables. Our framework enables a much larger class of reward functions such as the $\\max()$ function and nonlinear utility functions. Existing techniques relying on accurate estimations of the means of random variables, such as the upper confidence bound (UCB) technique, do not work directly on these functions. We propose a ","authors_text":"Fu Li, Jian Li, Pinyan Lu, Wei Chen, Wei Hu, Yu Liu","cross_cats":["cs.DS","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-20T20:54:41Z","title":"Combinatorial Multi-Armed Bandit with General Reward Functions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1610.06603","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:512428a5adacfcfefa99000052945a6bbf88f2a541e6868d276e6cfd0983eb2c","target":"record","created_at":"2026-05-18T00:10:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6cb602bbb1c998383dd59db298218d641162231151355d5f27fca8612180d37f","cross_cats_sorted":["cs.DS","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-20T20:54:41Z","title_canon_sha256":"699b2a110f16969fe252c875ed66aaedab99ebd90ac1444f5d75380047921a26"},"schema_version":"1.0","source":{"id":"1610.06603","kind":"arxiv","version":4}},"canonical_sha256":"56e6656918bfe720b4352ae98a06010ff80729b635129bcef850833bc01743b4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"56e6656918bfe720b4352ae98a06010ff80729b635129bcef850833bc01743b4","first_computed_at":"2026-05-18T00:10:19.574512Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:10:19.574512Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"el8WvR6bqL4UQZDtRv1IEWxxq/VEpAffa8j5upixkFkn0g5m9SOceWyiMtuMhMcEyhePTq9pIhuCDcLJX2nQBw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:10:19.575171Z","signed_message":"canonical_sha256_bytes"},"source_id":"1610.06603","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:512428a5adacfcfefa99000052945a6bbf88f2a541e6868d276e6cfd0983eb2c","sha256:5733441c7888d5e468c20204b9f8a95a1c5cf39f8f4142356ff038e986ec6536"],"state_sha256":"df293eb0d30e8678d70813bc4cb2972af3b694aa2b9845b25b8c9e38c70d639d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kiWdO9dz7ZHZngYWU261pasyUR8X3NLiarJFHNVJIN4hlEG7Lpm6U1zO9X1pcD5kOLdYuU1q0r3Wcccna/jzCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T00:57:39.592384Z","bundle_sha256":"cab2c30dfad0b6084ecf1d2fccbcc828150cb15dc5356864bb3ca07587523f37"}}