{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:S6JLOEMJ7E2ZBMK2U7UB5J4QKD","short_pith_number":"pith:S6JLOEMJ","canonical_record":{"source":{"id":"1808.07645","kind":"arxiv","version":5},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2018-08-23T06:34:32Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"5e97a70b885a51d5b24ffa258ecdb24dac93782e33d187480bee2e346304f5a8","abstract_canon_sha256":"1a3098cdd69bf5900b98add7a292b5d891461ce2c22d2059fa9c0612597d05ec"},"schema_version":"1.0"},"canonical_sha256":"9792b71189f93590b15aa7e81ea79050c3789182b7e8710ff3e2feb8f75a4cdf","source":{"kind":"arxiv","id":"1808.07645","version":5},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.07645","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"arxiv_version","alias_value":"1808.07645v5","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.07645","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"pith_short_12","alias_value":"S6JLOEMJ7E2Z","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"pith_short_16","alias_value":"S6JLOEMJ7E2ZBMK2","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"pith_short_8","alias_value":"S6JLOEMJ","created_at":"2026-07-03T01:17:09Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:S6JLOEMJ7E2ZBMK2U7UB5J4QKD","target":"record","payload":{"canonical_record":{"source":{"id":"1808.07645","kind":"arxiv","version":5},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2018-08-23T06:34:32Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"5e97a70b885a51d5b24ffa258ecdb24dac93782e33d187480bee2e346304f5a8","abstract_canon_sha256":"1a3098cdd69bf5900b98add7a292b5d891461ce2c22d2059fa9c0612597d05ec"},"schema_version":"1.0"},"canonical_sha256":"9792b71189f93590b15aa7e81ea79050c3789182b7e8710ff3e2feb8f75a4cdf","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-03T01:17:09.026373Z","signature_b64":"24TCcuueQaAx9MjfWNxufvz58t8uR95blciVVgkoYStFylgTe+lB5mMqwd5xQnxolJifNsN0Y9ToiZPaG6aTBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9792b71189f93590b15aa7e81ea79050c3789182b7e8710ff3e2feb8f75a4cdf","last_reissued_at":"2026-07-03T01:17:09.025963Z","signature_status":"signed_v1","first_computed_at":"2026-07-03T01:17:09.025963Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1808.07645","source_version":5,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-03T01:17:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"v3x+7AlmxtFpfV+oT56d72qpSXMHQQwWmE+XG1FqLabw+vAud5fWurBcT+gW2dorWexcBZkI0Rxpbbz44dlqAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-03T16:19:09.386067Z"},"content_sha256":"3bcc805fa38d66275c6f9a97895de757da51d1ce2a14ed5a9b7918ef2de0dbea","schema_version":"1.0","event_id":"sha256:3bcc805fa38d66275c6f9a97895de757da51d1ce2a14ed5a9b7918ef2de0dbea"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:S6JLOEMJ7E2ZBMK2U7UB5J4QKD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Playing 20 Question Game with Policy-Based Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.HC","authors_text":"Bingfeng Luo, Can Xu, Chongyang Tao, Huang Hu, Wei Wu, Xianchao Wu, Zhan Chen","submitted_at":"2018-08-23T06:34:32Z","abstract_excerpt":"The 20 Questions (Q20) game is a well known game which encourages deductive reasoning and creativity. In the game, the answerer first thinks of an object such as a famous person or a kind of animal. Then the questioner tries to guess the object by asking 20 questions. In a Q20 game system, the user is considered as the answerer while the system itself acts as the questioner which requires a good strategy of question selection to figure out the correct object and win the game. However, the optimal policy of question selection is hard to be derived due to the complexity and volatility of the gam"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.07645","kind":"arxiv","version":5},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/1808.07645/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-03T01:17:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"D698PXpMlioaY1wRbTjVUyWR/hgD3bjar90o0Vwvg4qi9YNwHZRyYWckxKpMbQMTS0BbFSj4DjGILJC7Z4XgBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-03T16:19:09.386506Z"},"content_sha256":"b27f0cd1ed73c06a69b4a71b0d595ec085e7d8b11494c31f2e297f3b3d61cf6c","schema_version":"1.0","event_id":"sha256:b27f0cd1ed73c06a69b4a71b0d595ec085e7d8b11494c31f2e297f3b3d61cf6c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/S6JLOEMJ7E2ZBMK2U7UB5J4QKD/bundle.json","state_url":"https://pith.science/pith/S6JLOEMJ7E2ZBMK2U7UB5J4QKD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/S6JLOEMJ7E2ZBMK2U7UB5J4QKD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-03T16:19:09Z","links":{"resolver":"https://pith.science/pith/S6JLOEMJ7E2ZBMK2U7UB5J4QKD","bundle":"https://pith.science/pith/S6JLOEMJ7E2ZBMK2U7UB5J4QKD/bundle.json","state":"https://pith.science/pith/S6JLOEMJ7E2ZBMK2U7UB5J4QKD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/S6JLOEMJ7E2ZBMK2U7UB5J4QKD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:S6JLOEMJ7E2ZBMK2U7UB5J4QKD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"1a3098cdd69bf5900b98add7a292b5d891461ce2c22d2059fa9c0612597d05ec","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2018-08-23T06:34:32Z","title_canon_sha256":"5e97a70b885a51d5b24ffa258ecdb24dac93782e33d187480bee2e346304f5a8"},"schema_version":"1.0","source":{"id":"1808.07645","kind":"arxiv","version":5}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.07645","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"arxiv_version","alias_value":"1808.07645v5","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.07645","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"pith_short_12","alias_value":"S6JLOEMJ7E2Z","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"pith_short_16","alias_value":"S6JLOEMJ7E2ZBMK2","created_at":"2026-07-03T01:17:09Z"},{"alias_kind":"pith_short_8","alias_value":"S6JLOEMJ","created_at":"2026-07-03T01:17:09Z"}],"graph_snapshots":[{"event_id":"sha256:b27f0cd1ed73c06a69b4a71b0d595ec085e7d8b11494c31f2e297f3b3d61cf6c","target":"graph","created_at":"2026-07-03T01:17:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/1808.07645/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"The 20 Questions (Q20) game is a well known game which encourages deductive reasoning and creativity. In the game, the answerer first thinks of an object such as a famous person or a kind of animal. Then the questioner tries to guess the object by asking 20 questions. In a Q20 game system, the user is considered as the answerer while the system itself acts as the questioner which requires a good strategy of question selection to figure out the correct object and win the game. However, the optimal policy of question selection is hard to be derived due to the complexity and volatility of the gam","authors_text":"Bingfeng Luo, Can Xu, Chongyang Tao, Huang Hu, Wei Wu, Xianchao Wu, Zhan Chen","cross_cats":["cs.AI","cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2018-08-23T06:34:32Z","title":"Playing 20 Question Game with Policy-Based Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.07645","kind":"arxiv","version":5},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3bcc805fa38d66275c6f9a97895de757da51d1ce2a14ed5a9b7918ef2de0dbea","target":"record","created_at":"2026-07-03T01:17:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"1a3098cdd69bf5900b98add7a292b5d891461ce2c22d2059fa9c0612597d05ec","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2018-08-23T06:34:32Z","title_canon_sha256":"5e97a70b885a51d5b24ffa258ecdb24dac93782e33d187480bee2e346304f5a8"},"schema_version":"1.0","source":{"id":"1808.07645","kind":"arxiv","version":5}},"canonical_sha256":"9792b71189f93590b15aa7e81ea79050c3789182b7e8710ff3e2feb8f75a4cdf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9792b71189f93590b15aa7e81ea79050c3789182b7e8710ff3e2feb8f75a4cdf","first_computed_at":"2026-07-03T01:17:09.025963Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-03T01:17:09.025963Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"24TCcuueQaAx9MjfWNxufvz58t8uR95blciVVgkoYStFylgTe+lB5mMqwd5xQnxolJifNsN0Y9ToiZPaG6aTBw==","signature_status":"signed_v1","signed_at":"2026-07-03T01:17:09.026373Z","signed_message":"canonical_sha256_bytes"},"source_id":"1808.07645","source_kind":"arxiv","source_version":5}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3bcc805fa38d66275c6f9a97895de757da51d1ce2a14ed5a9b7918ef2de0dbea","sha256:b27f0cd1ed73c06a69b4a71b0d595ec085e7d8b11494c31f2e297f3b3d61cf6c"],"state_sha256":"2d15909f90c57204fc62378e5c313d57c4216036fb2e3365c9f5ca226c625d32"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"suu48l7HjP40EOHe/agV7fpixFHeKvR7lyD2CAxhOd88E5aZehdt1fAq4WmeznP+XhfnFDsCun3szD+Ey7btDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-03T16:19:09.388651Z","bundle_sha256":"d66fb78407c0963ed59d01e11c621fffc094f43b63663050305b0eabd8ae57b5"}}