{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:BD3VOUPKMC554FXBXQAWPHSUF2","short_pith_number":"pith:BD3VOUPK","canonical_record":{"source":{"id":"1608.01972","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-08-05T18:53:42Z","cross_cats_sorted":["cs.IR"],"title_canon_sha256":"5866313e42334193d34b6a705fc9b751472d6be0bb271682d725f04d27d76b4e","abstract_canon_sha256":"80b7f22c513a02f644056b3621be9c1e7147ea3c95e3200caeaff1f7610f7e13"},"schema_version":"1.0"},"canonical_sha256":"08f75751ea60bbde16e1bc01679e542e918b591d19627bec3b20e64d0dbe568a","source":{"kind":"arxiv","id":"1608.01972","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1608.01972","created_at":"2026-05-18T00:32:36Z"},{"alias_kind":"arxiv_version","alias_value":"1608.01972v2","created_at":"2026-05-18T00:32:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1608.01972","created_at":"2026-05-18T00:32:36Z"},{"alias_kind":"pith_short_12","alias_value":"BD3VOUPKMC55","created_at":"2026-05-18T12:30:07Z"},{"alias_kind":"pith_short_16","alias_value":"BD3VOUPKMC554FXB","created_at":"2026-05-18T12:30:07Z"},{"alias_kind":"pith_short_8","alias_value":"BD3VOUPK","created_at":"2026-05-18T12:30:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:BD3VOUPKMC554FXBXQAWPHSUF2","target":"record","payload":{"canonical_record":{"source":{"id":"1608.01972","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-08-05T18:53:42Z","cross_cats_sorted":["cs.IR"],"title_canon_sha256":"5866313e42334193d34b6a705fc9b751472d6be0bb271682d725f04d27d76b4e","abstract_canon_sha256":"80b7f22c513a02f644056b3621be9c1e7147ea3c95e3200caeaff1f7610f7e13"},"schema_version":"1.0"},"canonical_sha256":"08f75751ea60bbde16e1bc01679e542e918b591d19627bec3b20e64d0dbe568a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:32:36.463036Z","signature_b64":"YXSuHo+s7YnFc21ILsqFpy3wUsX+VJGHLp8+2nW7fKrtTv0d4vJKOk3yMUa8yc99CMeUQZi7kuosKz3rfCS2Ag==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"08f75751ea60bbde16e1bc01679e542e918b591d19627bec3b20e64d0dbe568a","last_reissued_at":"2026-05-18T00:32:36.462211Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:32:36.462211Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1608.01972","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:32:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CLZ4R9ON0x6sMG+T7LjJRDCW/jRrKtJooOj+Un5jYbpiJ4J6zdAIvrKwRVyXHpLXtaZ3TMouFqb31Hfmuht/CA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T01:07:07.422460Z"},"content_sha256":"d0f6e6b0282d03bb293182767a0ac0bf7517e9ae154e2f8d5a25f91d939f98ae","schema_version":"1.0","event_id":"sha256:d0f6e6b0282d03bb293182767a0ac0bf7517e9ae154e2f8d5a25f91d939f98ae"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:BD3VOUPKMC554FXBXQAWPHSUF2","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Bridging the Gap: Incorporating a Semantic Similarity Measure for Effectively Mapping PubMed Queries to Documents","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Nicolas Fiorini, Sun Kim, W. John Wilbur, Zhiyong Lu","submitted_at":"2016-08-05T18:53:42Z","abstract_excerpt":"The main approach of traditional information retrieval (IR) is to examine how many words from a query appear in a document. A drawback of this approach, however, is that it may fail to detect relevant documents where no or only few words from a query are found. The semantic analysis methods such as LSA (latent semantic analysis) and LDA (latent Dirichlet allocation) have been proposed to address the issue, but their performance is not superior compared to common IR approaches. Here we present a query-document similarity measure motivated by the Word Mover's Distance. Unlike other similarity me"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1608.01972","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:32:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"mkzApjO3TZnN7Vsrxql1jXSnwEsbCi1Ffm9bThnmkGOROt6o7g6oMytCuQAKSRs9Qt+gf5EA6YLelnjKGrHdDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T01:07:07.422807Z"},"content_sha256":"c5823a467a5e832f92a9f10c125b4c29a16a1e044d7f86b8b5382a3ac994b3c0","schema_version":"1.0","event_id":"sha256:c5823a467a5e832f92a9f10c125b4c29a16a1e044d7f86b8b5382a3ac994b3c0"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/BD3VOUPKMC554FXBXQAWPHSUF2/bundle.json","state_url":"https://pith.science/pith/BD3VOUPKMC554FXBXQAWPHSUF2/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/BD3VOUPKMC554FXBXQAWPHSUF2/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T01:07:07Z","links":{"resolver":"https://pith.science/pith/BD3VOUPKMC554FXBXQAWPHSUF2","bundle":"https://pith.science/pith/BD3VOUPKMC554FXBXQAWPHSUF2/bundle.json","state":"https://pith.science/pith/BD3VOUPKMC554FXBXQAWPHSUF2/state.json","well_known_bundle":"https://pith.science/.well-known/pith/BD3VOUPKMC554FXBXQAWPHSUF2/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:BD3VOUPKMC554FXBXQAWPHSUF2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"80b7f22c513a02f644056b3621be9c1e7147ea3c95e3200caeaff1f7610f7e13","cross_cats_sorted":["cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-08-05T18:53:42Z","title_canon_sha256":"5866313e42334193d34b6a705fc9b751472d6be0bb271682d725f04d27d76b4e"},"schema_version":"1.0","source":{"id":"1608.01972","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1608.01972","created_at":"2026-05-18T00:32:36Z"},{"alias_kind":"arxiv_version","alias_value":"1608.01972v2","created_at":"2026-05-18T00:32:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1608.01972","created_at":"2026-05-18T00:32:36Z"},{"alias_kind":"pith_short_12","alias_value":"BD3VOUPKMC55","created_at":"2026-05-18T12:30:07Z"},{"alias_kind":"pith_short_16","alias_value":"BD3VOUPKMC554FXB","created_at":"2026-05-18T12:30:07Z"},{"alias_kind":"pith_short_8","alias_value":"BD3VOUPK","created_at":"2026-05-18T12:30:07Z"}],"graph_snapshots":[{"event_id":"sha256:c5823a467a5e832f92a9f10c125b4c29a16a1e044d7f86b8b5382a3ac994b3c0","target":"graph","created_at":"2026-05-18T00:32:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The main approach of traditional information retrieval (IR) is to examine how many words from a query appear in a document. A drawback of this approach, however, is that it may fail to detect relevant documents where no or only few words from a query are found. The semantic analysis methods such as LSA (latent semantic analysis) and LDA (latent Dirichlet allocation) have been proposed to address the issue, but their performance is not superior compared to common IR approaches. Here we present a query-document similarity measure motivated by the Word Mover's Distance. Unlike other similarity me","authors_text":"Nicolas Fiorini, Sun Kim, W. John Wilbur, Zhiyong Lu","cross_cats":["cs.IR"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-08-05T18:53:42Z","title":"Bridging the Gap: Incorporating a Semantic Similarity Measure for Effectively Mapping PubMed Queries to Documents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1608.01972","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d0f6e6b0282d03bb293182767a0ac0bf7517e9ae154e2f8d5a25f91d939f98ae","target":"record","created_at":"2026-05-18T00:32:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"80b7f22c513a02f644056b3621be9c1e7147ea3c95e3200caeaff1f7610f7e13","cross_cats_sorted":["cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-08-05T18:53:42Z","title_canon_sha256":"5866313e42334193d34b6a705fc9b751472d6be0bb271682d725f04d27d76b4e"},"schema_version":"1.0","source":{"id":"1608.01972","kind":"arxiv","version":2}},"canonical_sha256":"08f75751ea60bbde16e1bc01679e542e918b591d19627bec3b20e64d0dbe568a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"08f75751ea60bbde16e1bc01679e542e918b591d19627bec3b20e64d0dbe568a","first_computed_at":"2026-05-18T00:32:36.462211Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:32:36.462211Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"YXSuHo+s7YnFc21ILsqFpy3wUsX+VJGHLp8+2nW7fKrtTv0d4vJKOk3yMUa8yc99CMeUQZi7kuosKz3rfCS2Ag==","signature_status":"signed_v1","signed_at":"2026-05-18T00:32:36.463036Z","signed_message":"canonical_sha256_bytes"},"source_id":"1608.01972","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d0f6e6b0282d03bb293182767a0ac0bf7517e9ae154e2f8d5a25f91d939f98ae","sha256:c5823a467a5e832f92a9f10c125b4c29a16a1e044d7f86b8b5382a3ac994b3c0"],"state_sha256":"d00d4e8e0a03e3bb9a8856a6ee19eea7396499991f05cfcb72e1ee93b61f538d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sKS9Mo6FkKiIr6hd0jWwjYErCStJJV9hW1a8+mvqgIYwMw2oVTF4dJHuzSVqq+MWn2woLR6OdgwI556ws5fbCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T01:07:07.424661Z","bundle_sha256":"f6dbc85616c38a4fba478fff2362ae9a261f1c3d3d1c02069d7d11e6851e88cd"}}