{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:KFFRYICXPZGJHHG65O6SJTMIHD","short_pith_number":"pith:KFFRYICX","canonical_record":{"source":{"id":"1508.03116","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-08-13T04:23:58Z","cross_cats_sorted":[],"title_canon_sha256":"4a7f72ddeaeb193fd22a852fd074f6cf38a5cd9ff64bd412fa7c4e5c5789a1e4","abstract_canon_sha256":"c605ac8f2fde59383cc3fcca3d5901e91510b4ed42f27fa579f26ebc744a2009"},"schema_version":"1.0"},"canonical_sha256":"514b1c20577e4c939cdeebbd24cd8838f3984bdd66d01616bc93f8f1e79c50fd","source":{"kind":"arxiv","id":"1508.03116","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1508.03116","created_at":"2026-05-18T01:35:21Z"},{"alias_kind":"arxiv_version","alias_value":"1508.03116v1","created_at":"2026-05-18T01:35:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1508.03116","created_at":"2026-05-18T01:35:21Z"},{"alias_kind":"pith_short_12","alias_value":"KFFRYICXPZGJ","created_at":"2026-05-18T12:29:27Z"},{"alias_kind":"pith_short_16","alias_value":"KFFRYICXPZGJHHG6","created_at":"2026-05-18T12:29:27Z"},{"alias_kind":"pith_short_8","alias_value":"KFFRYICX","created_at":"2026-05-18T12:29:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:KFFRYICXPZGJHHG65O6SJTMIHD","target":"record","payload":{"canonical_record":{"source":{"id":"1508.03116","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-08-13T04:23:58Z","cross_cats_sorted":[],"title_canon_sha256":"4a7f72ddeaeb193fd22a852fd074f6cf38a5cd9ff64bd412fa7c4e5c5789a1e4","abstract_canon_sha256":"c605ac8f2fde59383cc3fcca3d5901e91510b4ed42f27fa579f26ebc744a2009"},"schema_version":"1.0"},"canonical_sha256":"514b1c20577e4c939cdeebbd24cd8838f3984bdd66d01616bc93f8f1e79c50fd","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:35:21.671743Z","signature_b64":"JonGX23vdz1halwx6vKA6YLFdXGicREddel+oy9a+V79bkvLLKwXxw0CZW3452sE09Y+ob55rDDJPDdcK9YVBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"514b1c20577e4c939cdeebbd24cd8838f3984bdd66d01616bc93f8f1e79c50fd","last_reissued_at":"2026-05-18T01:35:21.670979Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:35:21.670979Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1508.03116","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:35:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"itfSJLG96VkeB7rm+POUDkYUiCDqWyZdDxco30lHKhX5CgWyAsxuXGcjFqFxn0ftancIY1azDEL/nV7SJnrMBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T15:25:33.111710Z"},"content_sha256":"8ac4270bdb41d3a7d4732e78191fa4483ad15d5054f4ea2e4470a8d8495828e9","schema_version":"1.0","event_id":"sha256:8ac4270bdb41d3a7d4732e78191fa4483ad15d5054f4ea2e4470a8d8495828e9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:KFFRYICXPZGJHHG65O6SJTMIHD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Query-Driven Sampling for Collective Entity Resolution","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DB","authors_text":"Christan Grant, Daisy Zhe Wang, Michael L. Wick","submitted_at":"2015-08-13T04:23:58Z","abstract_excerpt":"Probabilistic databases play a preeminent role in the processing and management of uncertain data. Recently, many database research efforts have integrated probabilistic models into databases to support tasks such as information extraction and labeling. Many of these efforts are based on batch oriented inference which inhibits a realtime workflow. One important task is entity resolution (ER). ER is the process of determining records (mentions) in a database that correspond to the same real-world entity. Traditional pairwise ER methods can lead to inconsistencies and low accuracy due to localiz"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1508.03116","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:35:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"c82oaL651lFMRKabw88DabcRknInSbChHS3EN9x7lSnSxPY6BSFzMfCQo5J3dgLmxiK3Rv1Ikd2xJ7NbmgEzAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T15:25:33.112380Z"},"content_sha256":"84b8eaee639060d74d4e63d28652860bfe4b3c9e1633a4616a5a3d02d809c8a0","schema_version":"1.0","event_id":"sha256:84b8eaee639060d74d4e63d28652860bfe4b3c9e1633a4616a5a3d02d809c8a0"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/KFFRYICXPZGJHHG65O6SJTMIHD/bundle.json","state_url":"https://pith.science/pith/KFFRYICXPZGJHHG65O6SJTMIHD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/KFFRYICXPZGJHHG65O6SJTMIHD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T15:25:33Z","links":{"resolver":"https://pith.science/pith/KFFRYICXPZGJHHG65O6SJTMIHD","bundle":"https://pith.science/pith/KFFRYICXPZGJHHG65O6SJTMIHD/bundle.json","state":"https://pith.science/pith/KFFRYICXPZGJHHG65O6SJTMIHD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/KFFRYICXPZGJHHG65O6SJTMIHD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:KFFRYICXPZGJHHG65O6SJTMIHD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c605ac8f2fde59383cc3fcca3d5901e91510b4ed42f27fa579f26ebc744a2009","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-08-13T04:23:58Z","title_canon_sha256":"4a7f72ddeaeb193fd22a852fd074f6cf38a5cd9ff64bd412fa7c4e5c5789a1e4"},"schema_version":"1.0","source":{"id":"1508.03116","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1508.03116","created_at":"2026-05-18T01:35:21Z"},{"alias_kind":"arxiv_version","alias_value":"1508.03116v1","created_at":"2026-05-18T01:35:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1508.03116","created_at":"2026-05-18T01:35:21Z"},{"alias_kind":"pith_short_12","alias_value":"KFFRYICXPZGJ","created_at":"2026-05-18T12:29:27Z"},{"alias_kind":"pith_short_16","alias_value":"KFFRYICXPZGJHHG6","created_at":"2026-05-18T12:29:27Z"},{"alias_kind":"pith_short_8","alias_value":"KFFRYICX","created_at":"2026-05-18T12:29:27Z"}],"graph_snapshots":[{"event_id":"sha256:84b8eaee639060d74d4e63d28652860bfe4b3c9e1633a4616a5a3d02d809c8a0","target":"graph","created_at":"2026-05-18T01:35:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Probabilistic databases play a preeminent role in the processing and management of uncertain data. Recently, many database research efforts have integrated probabilistic models into databases to support tasks such as information extraction and labeling. Many of these efforts are based on batch oriented inference which inhibits a realtime workflow. One important task is entity resolution (ER). ER is the process of determining records (mentions) in a database that correspond to the same real-world entity. Traditional pairwise ER methods can lead to inconsistencies and low accuracy due to localiz","authors_text":"Christan Grant, Daisy Zhe Wang, Michael L. Wick","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-08-13T04:23:58Z","title":"Query-Driven Sampling for Collective Entity Resolution"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1508.03116","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8ac4270bdb41d3a7d4732e78191fa4483ad15d5054f4ea2e4470a8d8495828e9","target":"record","created_at":"2026-05-18T01:35:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c605ac8f2fde59383cc3fcca3d5901e91510b4ed42f27fa579f26ebc744a2009","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-08-13T04:23:58Z","title_canon_sha256":"4a7f72ddeaeb193fd22a852fd074f6cf38a5cd9ff64bd412fa7c4e5c5789a1e4"},"schema_version":"1.0","source":{"id":"1508.03116","kind":"arxiv","version":1}},"canonical_sha256":"514b1c20577e4c939cdeebbd24cd8838f3984bdd66d01616bc93f8f1e79c50fd","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"514b1c20577e4c939cdeebbd24cd8838f3984bdd66d01616bc93f8f1e79c50fd","first_computed_at":"2026-05-18T01:35:21.670979Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:35:21.670979Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"JonGX23vdz1halwx6vKA6YLFdXGicREddel+oy9a+V79bkvLLKwXxw0CZW3452sE09Y+ob55rDDJPDdcK9YVBg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:35:21.671743Z","signed_message":"canonical_sha256_bytes"},"source_id":"1508.03116","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8ac4270bdb41d3a7d4732e78191fa4483ad15d5054f4ea2e4470a8d8495828e9","sha256:84b8eaee639060d74d4e63d28652860bfe4b3c9e1633a4616a5a3d02d809c8a0"],"state_sha256":"115150ac2ab57732e7386cf23b2b2bde496227d52ce521b90d4fcbf008ab702e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Q6T/HLu9CB9RfpGS2OmCSotw+foTMk9C2kWbU4LwUR6Rs81BZDvYizbT4gvcselnRxPR5oAo42E/Jk26yZUuBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T15:25:33.116695Z","bundle_sha256":"66b50b3b4a53a7b6f649d78dfe1caa7ec9977934efafdc159fc10519001b11aa"}}