{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:X34CY4W3JPVRGBXHPSYHD47W2R","short_pith_number":"pith:X34CY4W3","canonical_record":{"source":{"id":"1812.07695","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-12-18T23:30:39Z","cross_cats_sorted":[],"title_canon_sha256":"f0bbb4489dbf7e85d7bf73b375598745ce59a0494d6c7562fccd259a21eeb11e","abstract_canon_sha256":"a55d780cd24c84eed960c73229b6991ee709d357323dd4d01adfd94976ebe8ab"},"schema_version":"1.0"},"canonical_sha256":"bef82c72db4beb1306e77cb071f3f6d476c4e979393a300a237fdcb5e66a9c6f","source":{"kind":"arxiv","id":"1812.07695","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1812.07695","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"arxiv_version","alias_value":"1812.07695v2","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1812.07695","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"pith_short_12","alias_value":"X34CY4W3JPVR","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_16","alias_value":"X34CY4W3JPVRGBXH","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_8","alias_value":"X34CY4W3","created_at":"2026-05-18T12:33:01Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:X34CY4W3JPVRGBXHPSYHD47W2R","target":"record","payload":{"canonical_record":{"source":{"id":"1812.07695","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-12-18T23:30:39Z","cross_cats_sorted":[],"title_canon_sha256":"f0bbb4489dbf7e85d7bf73b375598745ce59a0494d6c7562fccd259a21eeb11e","abstract_canon_sha256":"a55d780cd24c84eed960c73229b6991ee709d357323dd4d01adfd94976ebe8ab"},"schema_version":"1.0"},"canonical_sha256":"bef82c72db4beb1306e77cb071f3f6d476c4e979393a300a237fdcb5e66a9c6f","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:56:33.250201Z","signature_b64":"a1SaOCqmVI+ugBXyvPJqeJbxeC20UPgQACJErQe5kC1EbTVTMwnzxcT8+IwI2nHfnoj9aZ+6qu0ac7Rq+gMuBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"bef82c72db4beb1306e77cb071f3f6d476c4e979393a300a237fdcb5e66a9c6f","last_reissued_at":"2026-05-17T23:56:33.249696Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:56:33.249696Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1812.07695","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:33Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"faqHM8YX5KJlpNZ5Qo6K+S5wUqWjnJ6O2mt4pp0i5nbHsAl/wPGWizUQfpV3g672lHtICj2xL7OpTLoUcql8Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T04:47:31.391087Z"},"content_sha256":"abffb1ead0f48b9bf11c3530da2967368d09d5aaa2c1f785d082a621de24267f","schema_version":"1.0","event_id":"sha256:abffb1ead0f48b9bf11c3530da2967368d09d5aaa2c1f785d082a621de24267f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:X34CY4W3JPVRGBXHPSYHD47W2R","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Index-based, High-dimensional, Cosine Threshold Querying with Optimality Guarantees","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DB","authors_text":"Benjamin Pullman, Jianguo Wang, Nuno Bandeira, Yannis Papakonstantinou, Yuliang Li","submitted_at":"2018-12-18T23:30:39Z","abstract_excerpt":"Given a database of vectors, a cosine threshold query returns all vectors in the database having cosine similarity to a query vector above a given threshold {\\theta}. These queries arise naturally in many applications, such as document retrieval, image search, and mass spectrometry. The present paper considers the efficient evaluation of such queries, providing novel optimality guarantees and exhibiting good performance on real datasets. We take as a starting point Fagin's well-known Threshold Algorithm (TA), which can be used to answer cosine threshold queries as follows: an inverted index is"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1812.07695","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:33Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YHvaHKSU6Fl7oIkB4CDaGODiwoVEnFrDJU7KdtN8+ZYGRlk+Nt/onlp51wIuyAYAF1UNOmUlSM3vESiLj/dmCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T04:47:31.391476Z"},"content_sha256":"825e7820c76cd8dcbe44342ff337015176cdef09fb942f6fe95012e8c00900aa","schema_version":"1.0","event_id":"sha256:825e7820c76cd8dcbe44342ff337015176cdef09fb942f6fe95012e8c00900aa"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/X34CY4W3JPVRGBXHPSYHD47W2R/bundle.json","state_url":"https://pith.science/pith/X34CY4W3JPVRGBXHPSYHD47W2R/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/X34CY4W3JPVRGBXHPSYHD47W2R/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T04:47:31Z","links":{"resolver":"https://pith.science/pith/X34CY4W3JPVRGBXHPSYHD47W2R","bundle":"https://pith.science/pith/X34CY4W3JPVRGBXHPSYHD47W2R/bundle.json","state":"https://pith.science/pith/X34CY4W3JPVRGBXHPSYHD47W2R/state.json","well_known_bundle":"https://pith.science/.well-known/pith/X34CY4W3JPVRGBXHPSYHD47W2R/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:X34CY4W3JPVRGBXHPSYHD47W2R","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a55d780cd24c84eed960c73229b6991ee709d357323dd4d01adfd94976ebe8ab","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-12-18T23:30:39Z","title_canon_sha256":"f0bbb4489dbf7e85d7bf73b375598745ce59a0494d6c7562fccd259a21eeb11e"},"schema_version":"1.0","source":{"id":"1812.07695","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1812.07695","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"arxiv_version","alias_value":"1812.07695v2","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1812.07695","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"pith_short_12","alias_value":"X34CY4W3JPVR","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_16","alias_value":"X34CY4W3JPVRGBXH","created_at":"2026-05-18T12:33:01Z"},{"alias_kind":"pith_short_8","alias_value":"X34CY4W3","created_at":"2026-05-18T12:33:01Z"}],"graph_snapshots":[{"event_id":"sha256:825e7820c76cd8dcbe44342ff337015176cdef09fb942f6fe95012e8c00900aa","target":"graph","created_at":"2026-05-17T23:56:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Given a database of vectors, a cosine threshold query returns all vectors in the database having cosine similarity to a query vector above a given threshold {\\theta}. These queries arise naturally in many applications, such as document retrieval, image search, and mass spectrometry. The present paper considers the efficient evaluation of such queries, providing novel optimality guarantees and exhibiting good performance on real datasets. We take as a starting point Fagin's well-known Threshold Algorithm (TA), which can be used to answer cosine threshold queries as follows: an inverted index is","authors_text":"Benjamin Pullman, Jianguo Wang, Nuno Bandeira, Yannis Papakonstantinou, Yuliang Li","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-12-18T23:30:39Z","title":"Index-based, High-dimensional, Cosine Threshold Querying with Optimality Guarantees"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1812.07695","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:abffb1ead0f48b9bf11c3530da2967368d09d5aaa2c1f785d082a621de24267f","target":"record","created_at":"2026-05-17T23:56:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a55d780cd24c84eed960c73229b6991ee709d357323dd4d01adfd94976ebe8ab","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-12-18T23:30:39Z","title_canon_sha256":"f0bbb4489dbf7e85d7bf73b375598745ce59a0494d6c7562fccd259a21eeb11e"},"schema_version":"1.0","source":{"id":"1812.07695","kind":"arxiv","version":2}},"canonical_sha256":"bef82c72db4beb1306e77cb071f3f6d476c4e979393a300a237fdcb5e66a9c6f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"bef82c72db4beb1306e77cb071f3f6d476c4e979393a300a237fdcb5e66a9c6f","first_computed_at":"2026-05-17T23:56:33.249696Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:56:33.249696Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"a1SaOCqmVI+ugBXyvPJqeJbxeC20UPgQACJErQe5kC1EbTVTMwnzxcT8+IwI2nHfnoj9aZ+6qu0ac7Rq+gMuBg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:56:33.250201Z","signed_message":"canonical_sha256_bytes"},"source_id":"1812.07695","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:abffb1ead0f48b9bf11c3530da2967368d09d5aaa2c1f785d082a621de24267f","sha256:825e7820c76cd8dcbe44342ff337015176cdef09fb942f6fe95012e8c00900aa"],"state_sha256":"7562f7d06fe15d3a5b373bcc2016c2bc4ec0c8c30f4a482cae89264b294d189a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QKDmwDw6re2o6y6dYmuPbpKVw5eOwM+C4Ze20QiON6sGYPhuNC/p1dXd1HOiGPVOy2kZ8v8kAY+f6G1GjLjqAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T04:47:31.393502Z","bundle_sha256":"4683dcdf00a8a51c8dd3bf1b91c836d1bd1edd2c8af4fc5cd7f7bbd3c6491a08"}}