{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:KGJFG4WMLX2IKFFLQXMDXCT3LO","short_pith_number":"pith:KGJFG4WM","canonical_record":{"source":{"id":"1804.05942","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-04-13T17:08:45Z","cross_cats_sorted":["cs.DL"],"title_canon_sha256":"e4126cd1391e5d16c0a7c75f4b60dd97b323e1dff796c8a6aef55cc2694e05e9","abstract_canon_sha256":"11edd80d34ec3c8e9d03d2c08f8645f364bd6ec7ccc7235ce3997dff2e19fcd4"},"schema_version":"1.0"},"canonical_sha256":"51925372cc5df48514ab85d83b8a7b5b90b5f878878de1a8d59ea1b890226557","source":{"kind":"arxiv","id":"1804.05942","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.05942","created_at":"2026-05-18T00:02:45Z"},{"alias_kind":"arxiv_version","alias_value":"1804.05942v3","created_at":"2026-05-18T00:02:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.05942","created_at":"2026-05-18T00:02:45Z"},{"alias_kind":"pith_short_12","alias_value":"KGJFG4WMLX2I","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"KGJFG4WMLX2IKFFL","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"KGJFG4WM","created_at":"2026-05-18T12:32:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:KGJFG4WMLX2IKFFLQXMDXCT3LO","target":"record","payload":{"canonical_record":{"source":{"id":"1804.05942","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-04-13T17:08:45Z","cross_cats_sorted":["cs.DL"],"title_canon_sha256":"e4126cd1391e5d16c0a7c75f4b60dd97b323e1dff796c8a6aef55cc2694e05e9","abstract_canon_sha256":"11edd80d34ec3c8e9d03d2c08f8645f364bd6ec7ccc7235ce3997dff2e19fcd4"},"schema_version":"1.0"},"canonical_sha256":"51925372cc5df48514ab85d83b8a7b5b90b5f878878de1a8d59ea1b890226557","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:02:45.034063Z","signature_b64":"5+V9cLvApDI/h4eIfWD7dzgImBd8elCtdEmLP0ZSqO1y6wuhxHnVVlIm+fBav5tEkXHOFXr3caY1oXfQ7CcoCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"51925372cc5df48514ab85d83b8a7b5b90b5f878878de1a8d59ea1b890226557","last_reissued_at":"2026-05-18T00:02:45.033508Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:02:45.033508Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1804.05942","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"dsXV6d+21dLIwlZUY75joG/vjuBnLwfTZBbuoRRbLixBagMlpSLsz0KbLHoO4PujFQf60qNzFlnDpIvxP2UNAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T21:12:15.999558Z"},"content_sha256":"b2632254a7380e6b83998571efe23eeb808a19a246af8d3959840c42c3dfe9ff","schema_version":"1.0","event_id":"sha256:b2632254a7380e6b83998571efe23eeb808a19a246af8d3959840c42c3dfe9ff"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:KGJFG4WMLX2IKFFLQXMDXCT3LO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Are Abstracts Enough for Hypothesis Generation?","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DL"],"primary_cat":"cs.IR","authors_text":"Alexander Herzog, Angelo Carrabba, Ilya Safro, Justin Sybrandt","submitted_at":"2018-04-13T17:08:45Z","abstract_excerpt":"The potential for automatic hypothesis generation (HG) systems to improve research productivity keeps pace with the growing set of publicly available scientific information. But as data becomes easier to acquire, we must understand the effect different textual data sources have on our resulting hypotheses. Are abstracts enough for HG, or does it need full-text papers? How many papers does an HG system need to make valuable predictions? How sensitive is a general-purpose HG system to hyperparameter values or input quality? What effect does corpus size and document length have on HG results? To "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.05942","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"x272qWPu47h0betpNr1LEOQviIbKD6gCjU/xH2jHPUyfBCC6dphotavgfTRmxcV0c4VhSg+fExtR6B8w2rGRBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T21:12:16.000235Z"},"content_sha256":"a8e7b647171c822098d544c36099475b4215fd7e73ad32779edc53484071e5ed","schema_version":"1.0","event_id":"sha256:a8e7b647171c822098d544c36099475b4215fd7e73ad32779edc53484071e5ed"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/KGJFG4WMLX2IKFFLQXMDXCT3LO/bundle.json","state_url":"https://pith.science/pith/KGJFG4WMLX2IKFFLQXMDXCT3LO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/KGJFG4WMLX2IKFFLQXMDXCT3LO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-29T21:12:16Z","links":{"resolver":"https://pith.science/pith/KGJFG4WMLX2IKFFLQXMDXCT3LO","bundle":"https://pith.science/pith/KGJFG4WMLX2IKFFLQXMDXCT3LO/bundle.json","state":"https://pith.science/pith/KGJFG4WMLX2IKFFLQXMDXCT3LO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/KGJFG4WMLX2IKFFLQXMDXCT3LO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:KGJFG4WMLX2IKFFLQXMDXCT3LO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"11edd80d34ec3c8e9d03d2c08f8645f364bd6ec7ccc7235ce3997dff2e19fcd4","cross_cats_sorted":["cs.DL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-04-13T17:08:45Z","title_canon_sha256":"e4126cd1391e5d16c0a7c75f4b60dd97b323e1dff796c8a6aef55cc2694e05e9"},"schema_version":"1.0","source":{"id":"1804.05942","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.05942","created_at":"2026-05-18T00:02:45Z"},{"alias_kind":"arxiv_version","alias_value":"1804.05942v3","created_at":"2026-05-18T00:02:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.05942","created_at":"2026-05-18T00:02:45Z"},{"alias_kind":"pith_short_12","alias_value":"KGJFG4WMLX2I","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_16","alias_value":"KGJFG4WMLX2IKFFL","created_at":"2026-05-18T12:32:33Z"},{"alias_kind":"pith_short_8","alias_value":"KGJFG4WM","created_at":"2026-05-18T12:32:33Z"}],"graph_snapshots":[{"event_id":"sha256:a8e7b647171c822098d544c36099475b4215fd7e73ad32779edc53484071e5ed","target":"graph","created_at":"2026-05-18T00:02:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The potential for automatic hypothesis generation (HG) systems to improve research productivity keeps pace with the growing set of publicly available scientific information. But as data becomes easier to acquire, we must understand the effect different textual data sources have on our resulting hypotheses. Are abstracts enough for HG, or does it need full-text papers? How many papers does an HG system need to make valuable predictions? How sensitive is a general-purpose HG system to hyperparameter values or input quality? What effect does corpus size and document length have on HG results? To ","authors_text":"Alexander Herzog, Angelo Carrabba, Ilya Safro, Justin Sybrandt","cross_cats":["cs.DL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-04-13T17:08:45Z","title":"Are Abstracts Enough for Hypothesis Generation?"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.05942","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b2632254a7380e6b83998571efe23eeb808a19a246af8d3959840c42c3dfe9ff","target":"record","created_at":"2026-05-18T00:02:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"11edd80d34ec3c8e9d03d2c08f8645f364bd6ec7ccc7235ce3997dff2e19fcd4","cross_cats_sorted":["cs.DL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2018-04-13T17:08:45Z","title_canon_sha256":"e4126cd1391e5d16c0a7c75f4b60dd97b323e1dff796c8a6aef55cc2694e05e9"},"schema_version":"1.0","source":{"id":"1804.05942","kind":"arxiv","version":3}},"canonical_sha256":"51925372cc5df48514ab85d83b8a7b5b90b5f878878de1a8d59ea1b890226557","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"51925372cc5df48514ab85d83b8a7b5b90b5f878878de1a8d59ea1b890226557","first_computed_at":"2026-05-18T00:02:45.033508Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:02:45.033508Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"5+V9cLvApDI/h4eIfWD7dzgImBd8elCtdEmLP0ZSqO1y6wuhxHnVVlIm+fBav5tEkXHOFXr3caY1oXfQ7CcoCA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:02:45.034063Z","signed_message":"canonical_sha256_bytes"},"source_id":"1804.05942","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b2632254a7380e6b83998571efe23eeb808a19a246af8d3959840c42c3dfe9ff","sha256:a8e7b647171c822098d544c36099475b4215fd7e73ad32779edc53484071e5ed"],"state_sha256":"a6ec981088abc9ab44db0981f26bc9ee017dcd101683d405d474604e504473a4"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"tOvTjgSjRl3o5XqjtWBW+vxdnu3OXx0pAtBfwsGLJWX9HLHFl59SITbKR0PksC2ZFKplaQV5g14bd284lH4qAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-29T21:12:16.004109Z","bundle_sha256":"b7bf7968f9ac93a5cadbe3bc7410f3aaf18545e4b82c1564ba6c112623b06575"}}