{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:RTGESAQMBGLOHGVFQ4DGNCD6FV","short_pith_number":"pith:RTGESAQM","canonical_record":{"source":{"id":"1808.08622","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-26T21:12:43Z","cross_cats_sorted":[],"title_canon_sha256":"5263404c1bee5d9d0c74b3b093a5fd7170257d0370badab1f78b41c8dc49b7a4","abstract_canon_sha256":"31e018d449e6babf20380676ec634d52ac2f5bbb31424678ac1794b253ed10c0"},"schema_version":"1.0"},"canonical_sha256":"8ccc49020c0996e39aa5870666887e2d74713095737d7e78478b90ecb10b1fdb","source":{"kind":"arxiv","id":"1808.08622","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.08622","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"arxiv_version","alias_value":"1808.08622v1","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.08622","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"pith_short_12","alias_value":"RTGESAQMBGLO","created_at":"2026-05-18T12:32:50Z"},{"alias_kind":"pith_short_16","alias_value":"RTGESAQMBGLOHGVF","created_at":"2026-05-18T12:32:50Z"},{"alias_kind":"pith_short_8","alias_value":"RTGESAQM","created_at":"2026-05-18T12:32:50Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:RTGESAQMBGLOHGVFQ4DGNCD6FV","target":"record","payload":{"canonical_record":{"source":{"id":"1808.08622","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-26T21:12:43Z","cross_cats_sorted":[],"title_canon_sha256":"5263404c1bee5d9d0c74b3b093a5fd7170257d0370badab1f78b41c8dc49b7a4","abstract_canon_sha256":"31e018d449e6babf20380676ec634d52ac2f5bbb31424678ac1794b253ed10c0"},"schema_version":"1.0"},"canonical_sha256":"8ccc49020c0996e39aa5870666887e2d74713095737d7e78478b90ecb10b1fdb","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:07:13.849015Z","signature_b64":"9oYH8O+mcBuNHcLoexJLQQlCd1GThoNkZ1KdTOlUIoKZcXac1I3VwtEZB6YaIo8AAS0yrz+QM1vYbxaN9iUwDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8ccc49020c0996e39aa5870666887e2d74713095737d7e78478b90ecb10b1fdb","last_reissued_at":"2026-05-18T00:07:13.848509Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:07:13.848509Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1808.08622","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"f/DQ9mEOCFk2uUUo/YFAYcXGR9PPrFHdOjjdknQyWQssD658Jj251opV24yg9agn2SbJd3gaRGZrlzYixuMYCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T05:37:25.147004Z"},"content_sha256":"ea4b374058d5d0ad8c68cee5150a0dfcaba00fd6255c486132207c3e766d3fba","schema_version":"1.0","event_id":"sha256:ea4b374058d5d0ad8c68cee5150a0dfcaba00fd6255c486132207c3e766d3fba"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:RTGESAQMBGLOHGVFQ4DGNCD6FV","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Semi-Supervised Event Extraction with Paraphrase Clusters","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Colin Lockard, Daniel S. Weld, Hannaneh Hajishirzi, James Ferguson","submitted_at":"2018-08-26T21:12:43Z","abstract_excerpt":"Supervised event extraction systems are limited in their accuracy due to the lack of available training data. We present a method for self-training event extraction systems by bootstrapping additional training data. This is done by taking advantage of the occurrence of multiple mentions of the same event instances across newswire articles from multiple sources. If our system can make a highconfidence extraction of some mentions in such a cluster, it can then acquire diverse training examples by adding the other mentions as well. Our experiments show significant performance improvements on mult"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.08622","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZID6X+8ahsi0vCnMHYgGg/zCp4nGmVutAwVrI7j8pGMW5C5Rj96MO5cpvN8lI5o9shQd7Umon03exIJBf7tGBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T05:37:25.147737Z"},"content_sha256":"97f30e0316d2e6c8c7b4435b208d9578f37e19aa0fedc0bf1fd6750f282514f4","schema_version":"1.0","event_id":"sha256:97f30e0316d2e6c8c7b4435b208d9578f37e19aa0fedc0bf1fd6750f282514f4"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RTGESAQMBGLOHGVFQ4DGNCD6FV/bundle.json","state_url":"https://pith.science/pith/RTGESAQMBGLOHGVFQ4DGNCD6FV/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RTGESAQMBGLOHGVFQ4DGNCD6FV/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T05:37:25Z","links":{"resolver":"https://pith.science/pith/RTGESAQMBGLOHGVFQ4DGNCD6FV","bundle":"https://pith.science/pith/RTGESAQMBGLOHGVFQ4DGNCD6FV/bundle.json","state":"https://pith.science/pith/RTGESAQMBGLOHGVFQ4DGNCD6FV/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RTGESAQMBGLOHGVFQ4DGNCD6FV/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:RTGESAQMBGLOHGVFQ4DGNCD6FV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"31e018d449e6babf20380676ec634d52ac2f5bbb31424678ac1794b253ed10c0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-26T21:12:43Z","title_canon_sha256":"5263404c1bee5d9d0c74b3b093a5fd7170257d0370badab1f78b41c8dc49b7a4"},"schema_version":"1.0","source":{"id":"1808.08622","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1808.08622","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"arxiv_version","alias_value":"1808.08622v1","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1808.08622","created_at":"2026-05-18T00:07:13Z"},{"alias_kind":"pith_short_12","alias_value":"RTGESAQMBGLO","created_at":"2026-05-18T12:32:50Z"},{"alias_kind":"pith_short_16","alias_value":"RTGESAQMBGLOHGVF","created_at":"2026-05-18T12:32:50Z"},{"alias_kind":"pith_short_8","alias_value":"RTGESAQM","created_at":"2026-05-18T12:32:50Z"}],"graph_snapshots":[{"event_id":"sha256:97f30e0316d2e6c8c7b4435b208d9578f37e19aa0fedc0bf1fd6750f282514f4","target":"graph","created_at":"2026-05-18T00:07:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Supervised event extraction systems are limited in their accuracy due to the lack of available training data. We present a method for self-training event extraction systems by bootstrapping additional training data. This is done by taking advantage of the occurrence of multiple mentions of the same event instances across newswire articles from multiple sources. If our system can make a highconfidence extraction of some mentions in such a cluster, it can then acquire diverse training examples by adding the other mentions as well. Our experiments show significant performance improvements on mult","authors_text":"Colin Lockard, Daniel S. Weld, Hannaneh Hajishirzi, James Ferguson","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-26T21:12:43Z","title":"Semi-Supervised Event Extraction with Paraphrase Clusters"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1808.08622","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ea4b374058d5d0ad8c68cee5150a0dfcaba00fd6255c486132207c3e766d3fba","target":"record","created_at":"2026-05-18T00:07:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"31e018d449e6babf20380676ec634d52ac2f5bbb31424678ac1794b253ed10c0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-08-26T21:12:43Z","title_canon_sha256":"5263404c1bee5d9d0c74b3b093a5fd7170257d0370badab1f78b41c8dc49b7a4"},"schema_version":"1.0","source":{"id":"1808.08622","kind":"arxiv","version":1}},"canonical_sha256":"8ccc49020c0996e39aa5870666887e2d74713095737d7e78478b90ecb10b1fdb","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8ccc49020c0996e39aa5870666887e2d74713095737d7e78478b90ecb10b1fdb","first_computed_at":"2026-05-18T00:07:13.848509Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:07:13.848509Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"9oYH8O+mcBuNHcLoexJLQQlCd1GThoNkZ1KdTOlUIoKZcXac1I3VwtEZB6YaIo8AAS0yrz+QM1vYbxaN9iUwDQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:07:13.849015Z","signed_message":"canonical_sha256_bytes"},"source_id":"1808.08622","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ea4b374058d5d0ad8c68cee5150a0dfcaba00fd6255c486132207c3e766d3fba","sha256:97f30e0316d2e6c8c7b4435b208d9578f37e19aa0fedc0bf1fd6750f282514f4"],"state_sha256":"01b6e8dc05239044adcdc4ca9a7d266d50bff37715ef7bec5b6794dbe44be472"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2q7RDNxx81BmA7N6giwq+Ihy/2e3Xzg+4mCUvl4MaHEv6ywFdtmRBoe+nm3dcJ73Ir2c53vzQyPmZh4QBezXAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T05:37:25.152179Z","bundle_sha256":"d101f2232ffb8f8f4dd25565d9a4ef1481cc579840dc96fe4cd5c6e4f8614661"}}