{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2020:C42JI7U3KAMJXPIUMJ5PXZEOAJ","short_pith_number":"pith:C42JI7U3","canonical_record":{"source":{"id":"2006.10389","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2020-06-18T09:48:48Z","cross_cats_sorted":[],"title_canon_sha256":"d814995251be05f175a2fe621c7a7068aca3b19822d78c07116b97805208b721","abstract_canon_sha256":"a34f724271c0dec70100ad8d2b00d93dde9b7c18aa86928481b995e65a3090ac"},"schema_version":"1.0"},"canonical_sha256":"1734947e9b50189bbd14627afbe48e024d95c63455e071c2f92e43f1a3105a75","source":{"kind":"arxiv","id":"2006.10389","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2006.10389","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"arxiv_version","alias_value":"2006.10389v1","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2006.10389","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"pith_short_12","alias_value":"C42JI7U3KAMJ","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"pith_short_16","alias_value":"C42JI7U3KAMJXPIU","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"pith_short_8","alias_value":"C42JI7U3","created_at":"2026-07-05T01:11:17Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2020:C42JI7U3KAMJXPIUMJ5PXZEOAJ","target":"record","payload":{"canonical_record":{"source":{"id":"2006.10389","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2020-06-18T09:48:48Z","cross_cats_sorted":[],"title_canon_sha256":"d814995251be05f175a2fe621c7a7068aca3b19822d78c07116b97805208b721","abstract_canon_sha256":"a34f724271c0dec70100ad8d2b00d93dde9b7c18aa86928481b995e65a3090ac"},"schema_version":"1.0"},"canonical_sha256":"1734947e9b50189bbd14627afbe48e024d95c63455e071c2f92e43f1a3105a75","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T01:11:17.996889Z","signature_b64":"H6OCB1gHwen/LPpT4Nufu1BiNF74aDjxOx77zcB2sQap0VMltGkaFN1270J6UAQec/dh+zXxxgYIpodu9sK3BQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1734947e9b50189bbd14627afbe48e024d95c63455e071c2f92e43f1a3105a75","last_reissued_at":"2026-07-05T01:11:17.996535Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T01:11:17.996535Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2006.10389","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:11:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7jvYvOWbKth1rzEhzhDATuty0LtZn/jjtQEGD4WGGfyRmeBhsdU91tygSGbBY6O2M4Ec/0qqNDxOkxwRc9+uCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T11:54:37.520281Z"},"content_sha256":"6f11f9357cc5a7bf81195425cb7cfebfc4d9c7731de0ebd8c11fc7a42a791429","schema_version":"1.0","event_id":"sha256:6f11f9357cc5a7bf81195425cb7cfebfc4d9c7731de0ebd8c11fc7a42a791429"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2020:C42JI7U3KAMJXPIUMJ5PXZEOAJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Interactive Recommender System via Knowledge Graph-enhanced Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Haokun Chen, Kan Ren, Ruiming Tang, Sijin Zhou, Weinan Zhang, Xinyi Dai, Xiuqiang He, Yong Yu","submitted_at":"2020-06-18T09:48:48Z","abstract_excerpt":"Interactive recommender system (IRS) has drawn huge attention because of its flexible recommendation strategy and the consideration of optimal long-term user experiences. To deal with the dynamic user preference and optimize accumulative utilities, researchers have introduced reinforcement learning (RL) into IRS. However, RL methods share a common issue of sample efficiency, i.e., huge amount of interaction data is required to train an effective recommendation policy, which is caused by the sparse user responses and the large action space consisting of a large number of candidate items. Moreov"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2006.10389","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2006.10389/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:11:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"w+ZkBW2Mogiz/Y4+21ppFznBHLdKhwOXPEXFEKipE1T6GaJkSx9pKbbLZHg/WHhP0ehEEg4s+zKNJho18EI3Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T11:54:37.520701Z"},"content_sha256":"387f48e73b6647699e5a6823c78c11bbf7b3378277cab733a46d4356f0018b30","schema_version":"1.0","event_id":"sha256:387f48e73b6647699e5a6823c78c11bbf7b3378277cab733a46d4356f0018b30"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/C42JI7U3KAMJXPIUMJ5PXZEOAJ/bundle.json","state_url":"https://pith.science/pith/C42JI7U3KAMJXPIUMJ5PXZEOAJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/C42JI7U3KAMJXPIUMJ5PXZEOAJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T11:54:37Z","links":{"resolver":"https://pith.science/pith/C42JI7U3KAMJXPIUMJ5PXZEOAJ","bundle":"https://pith.science/pith/C42JI7U3KAMJXPIUMJ5PXZEOAJ/bundle.json","state":"https://pith.science/pith/C42JI7U3KAMJXPIUMJ5PXZEOAJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/C42JI7U3KAMJXPIUMJ5PXZEOAJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2020:C42JI7U3KAMJXPIUMJ5PXZEOAJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a34f724271c0dec70100ad8d2b00d93dde9b7c18aa86928481b995e65a3090ac","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2020-06-18T09:48:48Z","title_canon_sha256":"d814995251be05f175a2fe621c7a7068aca3b19822d78c07116b97805208b721"},"schema_version":"1.0","source":{"id":"2006.10389","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2006.10389","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"arxiv_version","alias_value":"2006.10389v1","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2006.10389","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"pith_short_12","alias_value":"C42JI7U3KAMJ","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"pith_short_16","alias_value":"C42JI7U3KAMJXPIU","created_at":"2026-07-05T01:11:17Z"},{"alias_kind":"pith_short_8","alias_value":"C42JI7U3","created_at":"2026-07-05T01:11:17Z"}],"graph_snapshots":[{"event_id":"sha256:387f48e73b6647699e5a6823c78c11bbf7b3378277cab733a46d4356f0018b30","target":"graph","created_at":"2026-07-05T01:11:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2006.10389/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Interactive recommender system (IRS) has drawn huge attention because of its flexible recommendation strategy and the consideration of optimal long-term user experiences. To deal with the dynamic user preference and optimize accumulative utilities, researchers have introduced reinforcement learning (RL) into IRS. However, RL methods share a common issue of sample efficiency, i.e., huge amount of interaction data is required to train an effective recommendation policy, which is caused by the sparse user responses and the large action space consisting of a large number of candidate items. Moreov","authors_text":"Haokun Chen, Kan Ren, Ruiming Tang, Sijin Zhou, Weinan Zhang, Xinyi Dai, Xiuqiang He, Yong Yu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2020-06-18T09:48:48Z","title":"Interactive Recommender System via Knowledge Graph-enhanced Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2006.10389","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6f11f9357cc5a7bf81195425cb7cfebfc4d9c7731de0ebd8c11fc7a42a791429","target":"record","created_at":"2026-07-05T01:11:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a34f724271c0dec70100ad8d2b00d93dde9b7c18aa86928481b995e65a3090ac","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2020-06-18T09:48:48Z","title_canon_sha256":"d814995251be05f175a2fe621c7a7068aca3b19822d78c07116b97805208b721"},"schema_version":"1.0","source":{"id":"2006.10389","kind":"arxiv","version":1}},"canonical_sha256":"1734947e9b50189bbd14627afbe48e024d95c63455e071c2f92e43f1a3105a75","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1734947e9b50189bbd14627afbe48e024d95c63455e071c2f92e43f1a3105a75","first_computed_at":"2026-07-05T01:11:17.996535Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T01:11:17.996535Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"H6OCB1gHwen/LPpT4Nufu1BiNF74aDjxOx77zcB2sQap0VMltGkaFN1270J6UAQec/dh+zXxxgYIpodu9sK3BQ==","signature_status":"signed_v1","signed_at":"2026-07-05T01:11:17.996889Z","signed_message":"canonical_sha256_bytes"},"source_id":"2006.10389","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6f11f9357cc5a7bf81195425cb7cfebfc4d9c7731de0ebd8c11fc7a42a791429","sha256:387f48e73b6647699e5a6823c78c11bbf7b3378277cab733a46d4356f0018b30"],"state_sha256":"954c8dd7a68180347ce692bb579f67d3123bc0253e57e07eac5865daa5d8cf68"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P08RIwUOO2a66CXcTnnxJw7FbOzn5dwVLX/GZhPIbUPibE4QJv9FKjBQUMbIlg3O2cf1dSMxDXnVFLpstXguBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T11:54:37.522858Z","bundle_sha256":"7a27d82b85e81420285686483c8df5d425edcfd1b112a4e419fb656755931c27"}}