{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:ULBGVE2U7D4WYML4XAIVHP3OH5","short_pith_number":"pith:ULBGVE2U","canonical_record":{"source":{"id":"1904.08051","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-04-17T02:21:51Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"94a9c58dd28112116b9c8dc913a519c85e3bca68ffe9e81646d123a98f3d6b57","abstract_canon_sha256":"31acf739b09e5783f7161acee266d073735bcc7b9183228764caeedf447e5b62"},"schema_version":"1.0"},"canonical_sha256":"a2c26a9354f8f96c317cb81153bf6e3f641c1097f9c5c7d6a76cb8bd9019d55a","source":{"kind":"arxiv","id":"1904.08051","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.08051","created_at":"2026-05-17T23:48:18Z"},{"alias_kind":"arxiv_version","alias_value":"1904.08051v1","created_at":"2026-05-17T23:48:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.08051","created_at":"2026-05-17T23:48:18Z"},{"alias_kind":"pith_short_12","alias_value":"ULBGVE2U7D4W","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"ULBGVE2U7D4WYML4","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"ULBGVE2U","created_at":"2026-05-18T12:33:30Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:ULBGVE2U7D4WYML4XAIVHP3OH5","target":"record","payload":{"canonical_record":{"source":{"id":"1904.08051","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-04-17T02:21:51Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"94a9c58dd28112116b9c8dc913a519c85e3bca68ffe9e81646d123a98f3d6b57","abstract_canon_sha256":"31acf739b09e5783f7161acee266d073735bcc7b9183228764caeedf447e5b62"},"schema_version":"1.0"},"canonical_sha256":"a2c26a9354f8f96c317cb81153bf6e3f641c1097f9c5c7d6a76cb8bd9019d55a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:48:18.914904Z","signature_b64":"go4D1GV+vyWXNk23ZqrIa0CeqhEyXCduaMUHm8mJRtslDBYJ+sVu0JDDhgVzfI325mtY66f7An9da2GTDHhMAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a2c26a9354f8f96c317cb81153bf6e3f641c1097f9c5c7d6a76cb8bd9019d55a","last_reissued_at":"2026-05-17T23:48:18.914301Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:48:18.914301Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1904.08051","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:48:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cFnIcu3r+44m4OOB7eU4lYPtRVeMCoqY5v3YLGFX2FxfN8YRt4LrzpPDG3PRVky7R+SBYiHB2D9E3L0yOZPnBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T05:26:26.995704Z"},"content_sha256":"a0d97bde74dcb8d654358b8ca77707b0933c7aa87d96140084fe7fa8bf04f669","schema_version":"1.0","event_id":"sha256:a0d97bde74dcb8d654358b8ca77707b0933c7aa87d96140084fe7fa8bf04f669"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:ULBGVE2U7D4WYML4XAIVHP3OH5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Posterior-regularized REINFORCE for Instance Selection in Distant Supervision","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Fei Wu, Qi Zhang, Shiliang Pu, Siliang Tang, Xiang Ren, Yueting Zhuang","submitted_at":"2019-04-17T02:21:51Z","abstract_excerpt":"This paper provides a new way to improve the efficiency of the REINFORCE training process. We apply it to the task of instance selection in distant supervision. Modeling the instance selection in one bag as a sequential decision process, a reinforcement learning agent is trained to determine whether an instance is valuable or not and construct a new bag with less noisy instances. However unbiased methods, such as REINFORCE, could usually take much time to train. This paper adopts posterior regularization (PR) to integrate some domain-specific rules in instance selection using REINFORCE. As the"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.08051","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:48:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+r96fKFZTuuPyHZ/HJPw5O/ABh6CjUKY+mNHurG05EjuEk+Sp6cd3maWA9Jq8UtuNzSExHfmZw6f/zfdMTuPAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T05:26:26.996061Z"},"content_sha256":"b82d559822b0825c31c3389362668e96b9598e2697804406da651a034ebccadd","schema_version":"1.0","event_id":"sha256:b82d559822b0825c31c3389362668e96b9598e2697804406da651a034ebccadd"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ULBGVE2U7D4WYML4XAIVHP3OH5/bundle.json","state_url":"https://pith.science/pith/ULBGVE2U7D4WYML4XAIVHP3OH5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ULBGVE2U7D4WYML4XAIVHP3OH5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T05:26:26Z","links":{"resolver":"https://pith.science/pith/ULBGVE2U7D4WYML4XAIVHP3OH5","bundle":"https://pith.science/pith/ULBGVE2U7D4WYML4XAIVHP3OH5/bundle.json","state":"https://pith.science/pith/ULBGVE2U7D4WYML4XAIVHP3OH5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ULBGVE2U7D4WYML4XAIVHP3OH5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:ULBGVE2U7D4WYML4XAIVHP3OH5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"31acf739b09e5783f7161acee266d073735bcc7b9183228764caeedf447e5b62","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-04-17T02:21:51Z","title_canon_sha256":"94a9c58dd28112116b9c8dc913a519c85e3bca68ffe9e81646d123a98f3d6b57"},"schema_version":"1.0","source":{"id":"1904.08051","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.08051","created_at":"2026-05-17T23:48:18Z"},{"alias_kind":"arxiv_version","alias_value":"1904.08051v1","created_at":"2026-05-17T23:48:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.08051","created_at":"2026-05-17T23:48:18Z"},{"alias_kind":"pith_short_12","alias_value":"ULBGVE2U7D4W","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"ULBGVE2U7D4WYML4","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"ULBGVE2U","created_at":"2026-05-18T12:33:30Z"}],"graph_snapshots":[{"event_id":"sha256:b82d559822b0825c31c3389362668e96b9598e2697804406da651a034ebccadd","target":"graph","created_at":"2026-05-17T23:48:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"This paper provides a new way to improve the efficiency of the REINFORCE training process. We apply it to the task of instance selection in distant supervision. Modeling the instance selection in one bag as a sequential decision process, a reinforcement learning agent is trained to determine whether an instance is valuable or not and construct a new bag with less noisy instances. However unbiased methods, such as REINFORCE, could usually take much time to train. This paper adopts posterior regularization (PR) to integrate some domain-specific rules in instance selection using REINFORCE. As the","authors_text":"Fei Wu, Qi Zhang, Shiliang Pu, Siliang Tang, Xiang Ren, Yueting Zhuang","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-04-17T02:21:51Z","title":"Posterior-regularized REINFORCE for Instance Selection in Distant Supervision"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.08051","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a0d97bde74dcb8d654358b8ca77707b0933c7aa87d96140084fe7fa8bf04f669","target":"record","created_at":"2026-05-17T23:48:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"31acf739b09e5783f7161acee266d073735bcc7b9183228764caeedf447e5b62","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-04-17T02:21:51Z","title_canon_sha256":"94a9c58dd28112116b9c8dc913a519c85e3bca68ffe9e81646d123a98f3d6b57"},"schema_version":"1.0","source":{"id":"1904.08051","kind":"arxiv","version":1}},"canonical_sha256":"a2c26a9354f8f96c317cb81153bf6e3f641c1097f9c5c7d6a76cb8bd9019d55a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a2c26a9354f8f96c317cb81153bf6e3f641c1097f9c5c7d6a76cb8bd9019d55a","first_computed_at":"2026-05-17T23:48:18.914301Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:48:18.914301Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"go4D1GV+vyWXNk23ZqrIa0CeqhEyXCduaMUHm8mJRtslDBYJ+sVu0JDDhgVzfI325mtY66f7An9da2GTDHhMAw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:48:18.914904Z","signed_message":"canonical_sha256_bytes"},"source_id":"1904.08051","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a0d97bde74dcb8d654358b8ca77707b0933c7aa87d96140084fe7fa8bf04f669","sha256:b82d559822b0825c31c3389362668e96b9598e2697804406da651a034ebccadd"],"state_sha256":"fa00514320a9043275274442b3e50d925d19ad815d1d551f7f1f13f250a72b30"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/FONAKk6DFO5f6uHVqwEjxGY1Z0zxg6KIhr6sVUvQEmVF086QMHAImPh3ZLMgB3FFpcFjClEkIQoNHMuc+lgBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T05:26:26.997985Z","bundle_sha256":"558cbbea7989b6096f14ebd56b0cae5d8e77a527a32b4e377f4329f0a321538e"}}