{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:5E6P7PO3CPHYXTNI5NJJBF6KY3","short_pith_number":"pith:5E6P7PO3","canonical_record":{"source":{"id":"1708.07607","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2017-08-25T03:55:21Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"536bb2f64dfbc047f151b5aed9d0f1a4429c3258475a7da21b8503066159004b","abstract_canon_sha256":"bb23d2d1dfea8893301a41fbd8e4009850967125348537819999714edc9eb9bc"},"schema_version":"1.0"},"canonical_sha256":"e93cffbddb13cf8bcda8eb529097cac6ff8ca1d6fb0e1e5759b9798df11cf943","source":{"kind":"arxiv","id":"1708.07607","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.07607","created_at":"2026-05-18T00:22:33Z"},{"alias_kind":"arxiv_version","alias_value":"1708.07607v3","created_at":"2026-05-18T00:22:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.07607","created_at":"2026-05-18T00:22:33Z"},{"alias_kind":"pith_short_12","alias_value":"5E6P7PO3CPHY","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_16","alias_value":"5E6P7PO3CPHYXTNI","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_8","alias_value":"5E6P7PO3","created_at":"2026-05-18T12:31:00Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:5E6P7PO3CPHYXTNI5NJJBF6KY3","target":"record","payload":{"canonical_record":{"source":{"id":"1708.07607","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2017-08-25T03:55:21Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"536bb2f64dfbc047f151b5aed9d0f1a4429c3258475a7da21b8503066159004b","abstract_canon_sha256":"bb23d2d1dfea8893301a41fbd8e4009850967125348537819999714edc9eb9bc"},"schema_version":"1.0"},"canonical_sha256":"e93cffbddb13cf8bcda8eb529097cac6ff8ca1d6fb0e1e5759b9798df11cf943","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:22:33.251264Z","signature_b64":"cCfImD/fhWK+ATl1sV9yRHmCh9iu/x9a/gF0HbMfpNVX6fIvg17T9vnKsizl11QFrxdUDMLlmJ3Ogxkf7Q8kBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e93cffbddb13cf8bcda8eb529097cac6ff8ca1d6fb0e1e5759b9798df11cf943","last_reissued_at":"2026-05-18T00:22:33.250842Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:22:33.250842Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1708.07607","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:33Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G51gI/LNRDsWDTkL84YDCUQtQjMtce0EspO7q5r89zPONvrsf9ujg1LiBhb1RPc6iQMdruDtfPWByINNTGDyCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T16:33:31.232657Z"},"content_sha256":"db8e695465bb245babff49b2020c66f8bd54097d9a88d4a457c10716fdf9c225","schema_version":"1.0","event_id":"sha256:db8e695465bb245babff49b2020c66f8bd54097d9a88d4a457c10716fdf9c225"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:5E6P7PO3CPHYXTNI5NJJBF6KY3","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Reinforcement Mechanism Design for e-commerce","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.MA","authors_text":"Aris Filos-Ratsikas, Pingzhong Tang, Qingpeng Cai, Yiwei Zhang","submitted_at":"2017-08-25T03:55:21Z","abstract_excerpt":"We study the problem of allocating impressions to sellers in e-commerce websites, such as Amazon, eBay or Taobao, aiming to maximize the total revenue generated by the platform. We employ a general framework of reinforcement mechanism design, which uses deep reinforcement learning to design efficient algorithms, taking the strategic behaviour of the sellers into account. Specifically, we model the impression allocation problem as a Markov decision process, where the states encode the history of impressions, prices, transactions and generated revenue and the actions are the possible impression "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.07607","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:33Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OQoPeQxXhqGbgIzpJG8baj6smg0cUbrOP2FFl4lfX/5Tq6SnFUg2BJYXYrGUqOFOgpmRr1gWi/nQEHZCHUdbAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T16:33:31.232994Z"},"content_sha256":"626bbd465dfadb194ebfdefc75b99eb7178d862f38e0da05a051d44230fd73a2","schema_version":"1.0","event_id":"sha256:626bbd465dfadb194ebfdefc75b99eb7178d862f38e0da05a051d44230fd73a2"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5E6P7PO3CPHYXTNI5NJJBF6KY3/bundle.json","state_url":"https://pith.science/pith/5E6P7PO3CPHYXTNI5NJJBF6KY3/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5E6P7PO3CPHYXTNI5NJJBF6KY3/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T16:33:31Z","links":{"resolver":"https://pith.science/pith/5E6P7PO3CPHYXTNI5NJJBF6KY3","bundle":"https://pith.science/pith/5E6P7PO3CPHYXTNI5NJJBF6KY3/bundle.json","state":"https://pith.science/pith/5E6P7PO3CPHYXTNI5NJJBF6KY3/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5E6P7PO3CPHYXTNI5NJJBF6KY3/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:5E6P7PO3CPHYXTNI5NJJBF6KY3","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"bb23d2d1dfea8893301a41fbd8e4009850967125348537819999714edc9eb9bc","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2017-08-25T03:55:21Z","title_canon_sha256":"536bb2f64dfbc047f151b5aed9d0f1a4429c3258475a7da21b8503066159004b"},"schema_version":"1.0","source":{"id":"1708.07607","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.07607","created_at":"2026-05-18T00:22:33Z"},{"alias_kind":"arxiv_version","alias_value":"1708.07607v3","created_at":"2026-05-18T00:22:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.07607","created_at":"2026-05-18T00:22:33Z"},{"alias_kind":"pith_short_12","alias_value":"5E6P7PO3CPHY","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_16","alias_value":"5E6P7PO3CPHYXTNI","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_8","alias_value":"5E6P7PO3","created_at":"2026-05-18T12:31:00Z"}],"graph_snapshots":[{"event_id":"sha256:626bbd465dfadb194ebfdefc75b99eb7178d862f38e0da05a051d44230fd73a2","target":"graph","created_at":"2026-05-18T00:22:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We study the problem of allocating impressions to sellers in e-commerce websites, such as Amazon, eBay or Taobao, aiming to maximize the total revenue generated by the platform. We employ a general framework of reinforcement mechanism design, which uses deep reinforcement learning to design efficient algorithms, taking the strategic behaviour of the sellers into account. Specifically, we model the impression allocation problem as a Markov decision process, where the states encode the history of impressions, prices, transactions and generated revenue and the actions are the possible impression ","authors_text":"Aris Filos-Ratsikas, Pingzhong Tang, Qingpeng Cai, Yiwei Zhang","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2017-08-25T03:55:21Z","title":"Reinforcement Mechanism Design for e-commerce"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.07607","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:db8e695465bb245babff49b2020c66f8bd54097d9a88d4a457c10716fdf9c225","target":"record","created_at":"2026-05-18T00:22:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"bb23d2d1dfea8893301a41fbd8e4009850967125348537819999714edc9eb9bc","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.MA","submitted_at":"2017-08-25T03:55:21Z","title_canon_sha256":"536bb2f64dfbc047f151b5aed9d0f1a4429c3258475a7da21b8503066159004b"},"schema_version":"1.0","source":{"id":"1708.07607","kind":"arxiv","version":3}},"canonical_sha256":"e93cffbddb13cf8bcda8eb529097cac6ff8ca1d6fb0e1e5759b9798df11cf943","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e93cffbddb13cf8bcda8eb529097cac6ff8ca1d6fb0e1e5759b9798df11cf943","first_computed_at":"2026-05-18T00:22:33.250842Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:22:33.250842Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"cCfImD/fhWK+ATl1sV9yRHmCh9iu/x9a/gF0HbMfpNVX6fIvg17T9vnKsizl11QFrxdUDMLlmJ3Ogxkf7Q8kBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:22:33.251264Z","signed_message":"canonical_sha256_bytes"},"source_id":"1708.07607","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:db8e695465bb245babff49b2020c66f8bd54097d9a88d4a457c10716fdf9c225","sha256:626bbd465dfadb194ebfdefc75b99eb7178d862f38e0da05a051d44230fd73a2"],"state_sha256":"cc6c5d5f844790c1794ffa62b36d279a9e487f27f13b70628fbcde0855022efa"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sf/FgkdqEcMq3AkzYehDid4qtuMGyXD/6UWxzfKGd21hOIFpBqd6q5c4CjkZJi1bU98T/Iu5wuknPbXvFaSpAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T16:33:31.234747Z","bundle_sha256":"dda9136155da9f565580e18c6de1e1f404599fb4874243e857c0f259d5d8a015"}}