{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:2WAQYDYYEWLTPUCDMDYQ2NGM5D","short_pith_number":"pith:2WAQYDYY","schema_version":"1.0","canonical_sha256":"d5810c0f18259737d04360f10d34cce8d9564a7e6cb57ef19e97442174ac3d8a","source":{"kind":"arxiv","id":"1809.05385","version":1},"attestation_state":"computed","paper":{"title":"Index-Based Policy for Risk-Averse Multi-Armed Bandit","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"math.OC","authors_text":"Jianyu Xu, William B. Haskell, Zhisheng Ye","submitted_at":"2018-09-14T13:04:56Z","abstract_excerpt":"The multi-armed bandit (MAB) is a classical online optimization model for the trade-off between exploration and exploitation. The traditional MAB is concerned with finding the arm that minimizes the mean cost. However, minimizing the mean does not take the risk of the problem into account. We now want to accommodate risk-averse decision makers. In this work, we introduce a coherent risk measure as the criterion to form a risk-averse MAB. In particular, we derive an index-based online sampling framework for the risk-averse MAB. We develop this framework in detail for three specific risk measure"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1809.05385","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"math.OC","submitted_at":"2018-09-14T13:04:56Z","cross_cats_sorted":[],"title_canon_sha256":"65042778d8fee6cf5322720ba874c202c7500327a606c15c9e377df59e95afa0","abstract_canon_sha256":"6a528d2af1e7075b96ae69b19dffdb198d06d0bb0dc41d6fc70a7db72e2a8faa"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:05:41.610258Z","signature_b64":"USVUSEhFYCqfOl66RVpRFmHUcXdXI8Ae47h3v9Wson6WgTDOcU8JJL1VC7OqFNwkBDzpjOTMcY6jXHifgfzXAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d5810c0f18259737d04360f10d34cce8d9564a7e6cb57ef19e97442174ac3d8a","last_reissued_at":"2026-05-18T00:05:41.609723Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:05:41.609723Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Index-Based Policy for Risk-Averse Multi-Armed Bandit","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"math.OC","authors_text":"Jianyu Xu, William B. Haskell, Zhisheng Ye","submitted_at":"2018-09-14T13:04:56Z","abstract_excerpt":"The multi-armed bandit (MAB) is a classical online optimization model for the trade-off between exploration and exploitation. The traditional MAB is concerned with finding the arm that minimizes the mean cost. However, minimizing the mean does not take the risk of the problem into account. We now want to accommodate risk-averse decision makers. In this work, we introduce a coherent risk measure as the criterion to form a risk-averse MAB. In particular, we derive an index-based online sampling framework for the risk-averse MAB. We develop this framework in detail for three specific risk measure"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.05385","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1809.05385","created_at":"2026-05-18T00:05:41.609810+00:00"},{"alias_kind":"arxiv_version","alias_value":"1809.05385v1","created_at":"2026-05-18T00:05:41.609810+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.05385","created_at":"2026-05-18T00:05:41.609810+00:00"},{"alias_kind":"pith_short_12","alias_value":"2WAQYDYYEWLT","created_at":"2026-05-18T12:32:02.567920+00:00"},{"alias_kind":"pith_short_16","alias_value":"2WAQYDYYEWLTPUCD","created_at":"2026-05-18T12:32:02.567920+00:00"},{"alias_kind":"pith_short_8","alias_value":"2WAQYDYY","created_at":"2026-05-18T12:32:02.567920+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D","json":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D.json","graph_json":"https://pith.science/api/pith-number/2WAQYDYYEWLTPUCDMDYQ2NGM5D/graph.json","events_json":"https://pith.science/api/pith-number/2WAQYDYYEWLTPUCDMDYQ2NGM5D/events.json","paper":"https://pith.science/paper/2WAQYDYY"},"agent_actions":{"view_html":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D","download_json":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D.json","view_paper":"https://pith.science/paper/2WAQYDYY","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1809.05385&json=true","fetch_graph":"https://pith.science/api/pith-number/2WAQYDYYEWLTPUCDMDYQ2NGM5D/graph.json","fetch_events":"https://pith.science/api/pith-number/2WAQYDYYEWLTPUCDMDYQ2NGM5D/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D/action/timestamp_anchor","attest_storage":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D/action/storage_attestation","attest_author":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D/action/author_attestation","sign_citation":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D/action/citation_signature","submit_replication":"https://pith.science/pith/2WAQYDYYEWLTPUCDMDYQ2NGM5D/action/replication_record"}},"created_at":"2026-05-18T00:05:41.609810+00:00","updated_at":"2026-05-18T00:05:41.609810+00:00"}