{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:USGP7OWFT6P3IGAFCHWT4DJUXD","short_pith_number":"pith:USGP7OWF","canonical_record":{"source":{"id":"1502.00731","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-02-03T04:16:24Z","cross_cats_sorted":["cs.CL","cs.LG"],"title_canon_sha256":"1c1875c47ddc9d41876914f64ef8e60ba309aa9d49df0061924308b529ab5916","abstract_canon_sha256":"ab17b56c535a18b3491dd27756199acba6e1315ec707c5b6b2f73b8d39cfac0b"},"schema_version":"1.0"},"canonical_sha256":"a48cffbac59f9fb4180511ed3e0d34b8f196b3aec5a584bb86845f08f31e69e0","source":{"kind":"arxiv","id":"1502.00731","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1502.00731","created_at":"2026-05-18T01:48:06Z"},{"alias_kind":"arxiv_version","alias_value":"1502.00731v4","created_at":"2026-05-18T01:48:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1502.00731","created_at":"2026-05-18T01:48:06Z"},{"alias_kind":"pith_short_12","alias_value":"USGP7OWFT6P3","created_at":"2026-05-18T12:29:44Z"},{"alias_kind":"pith_short_16","alias_value":"USGP7OWFT6P3IGAF","created_at":"2026-05-18T12:29:44Z"},{"alias_kind":"pith_short_8","alias_value":"USGP7OWF","created_at":"2026-05-18T12:29:44Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:USGP7OWFT6P3IGAFCHWT4DJUXD","target":"record","payload":{"canonical_record":{"source":{"id":"1502.00731","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-02-03T04:16:24Z","cross_cats_sorted":["cs.CL","cs.LG"],"title_canon_sha256":"1c1875c47ddc9d41876914f64ef8e60ba309aa9d49df0061924308b529ab5916","abstract_canon_sha256":"ab17b56c535a18b3491dd27756199acba6e1315ec707c5b6b2f73b8d39cfac0b"},"schema_version":"1.0"},"canonical_sha256":"a48cffbac59f9fb4180511ed3e0d34b8f196b3aec5a584bb86845f08f31e69e0","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:48:06.402653Z","signature_b64":"27hGt5fX1/2vKU0tBQXFP6SeEKEfJk369WjFETpVoD/kYXRcfSY8RiIwV7tRQJLHVRXa869qXN6IA95F+7T3Dw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a48cffbac59f9fb4180511ed3e0d34b8f196b3aec5a584bb86845f08f31e69e0","last_reissued_at":"2026-05-18T01:48:06.402039Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:48:06.402039Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1502.00731","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:48:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"AnP+QOuBtkv4Q1PeC8dPs/w02Dj/eEQEvm27qKqD9nHRr+MuhQhUFhDCESJQE6SnIyc1LjKWf5ByGjTmAWQ5BA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:59:56.237966Z"},"content_sha256":"2e8c7659ba832a8ecd0d1637fd6e4aa938430eee675edd91a7d222890fc84534","schema_version":"1.0","event_id":"sha256:2e8c7659ba832a8ecd0d1637fd6e4aa938430eee675edd91a7d222890fc84534"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:USGP7OWFT6P3IGAFCHWT4DJUXD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Incremental Knowledge Base Construction Using DeepDive","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.LG"],"primary_cat":"cs.DB","authors_text":"Ce Zhang, Christopher De Sa, Christopher R\\'e, Feiran Wang, Jaeho Shin, Sen Wu","submitted_at":"2015-02-03T04:16:24Z","abstract_excerpt":"Populating a database with unstructured information is a long-standing problem in industry and research that encompasses problems of extraction, cleaning, and integration. Recent names used for this problem include dealing with dark data and knowledge base construction (KBC). In this work, we describe DeepDive, a system that combines database and machine learning ideas to help develop KBC systems, and we present techniques to make the KBC process more efficient. We observe that the KBC process is iterative, and we develop techniques to incrementally produce inference results for KBC systems. W"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1502.00731","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:48:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vn7OeBXjJt0OQFkyBQJw8D9SjQ+wgYz1Y5t+EC9Uy9FduNncD/oGtUete5GpV3HhJlHYwO0uzzyhHZyz0XfYBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:59:56.238420Z"},"content_sha256":"cdf07de78f29343025250b85d1b9ae709244e8d99faeb7b914e2e2ce7bafbb0f","schema_version":"1.0","event_id":"sha256:cdf07de78f29343025250b85d1b9ae709244e8d99faeb7b914e2e2ce7bafbb0f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/USGP7OWFT6P3IGAFCHWT4DJUXD/bundle.json","state_url":"https://pith.science/pith/USGP7OWFT6P3IGAFCHWT4DJUXD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/USGP7OWFT6P3IGAFCHWT4DJUXD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T12:59:56Z","links":{"resolver":"https://pith.science/pith/USGP7OWFT6P3IGAFCHWT4DJUXD","bundle":"https://pith.science/pith/USGP7OWFT6P3IGAFCHWT4DJUXD/bundle.json","state":"https://pith.science/pith/USGP7OWFT6P3IGAFCHWT4DJUXD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/USGP7OWFT6P3IGAFCHWT4DJUXD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:USGP7OWFT6P3IGAFCHWT4DJUXD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ab17b56c535a18b3491dd27756199acba6e1315ec707c5b6b2f73b8d39cfac0b","cross_cats_sorted":["cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-02-03T04:16:24Z","title_canon_sha256":"1c1875c47ddc9d41876914f64ef8e60ba309aa9d49df0061924308b529ab5916"},"schema_version":"1.0","source":{"id":"1502.00731","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1502.00731","created_at":"2026-05-18T01:48:06Z"},{"alias_kind":"arxiv_version","alias_value":"1502.00731v4","created_at":"2026-05-18T01:48:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1502.00731","created_at":"2026-05-18T01:48:06Z"},{"alias_kind":"pith_short_12","alias_value":"USGP7OWFT6P3","created_at":"2026-05-18T12:29:44Z"},{"alias_kind":"pith_short_16","alias_value":"USGP7OWFT6P3IGAF","created_at":"2026-05-18T12:29:44Z"},{"alias_kind":"pith_short_8","alias_value":"USGP7OWF","created_at":"2026-05-18T12:29:44Z"}],"graph_snapshots":[{"event_id":"sha256:cdf07de78f29343025250b85d1b9ae709244e8d99faeb7b914e2e2ce7bafbb0f","target":"graph","created_at":"2026-05-18T01:48:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Populating a database with unstructured information is a long-standing problem in industry and research that encompasses problems of extraction, cleaning, and integration. Recent names used for this problem include dealing with dark data and knowledge base construction (KBC). In this work, we describe DeepDive, a system that combines database and machine learning ideas to help develop KBC systems, and we present techniques to make the KBC process more efficient. We observe that the KBC process is iterative, and we develop techniques to incrementally produce inference results for KBC systems. W","authors_text":"Ce Zhang, Christopher De Sa, Christopher R\\'e, Feiran Wang, Jaeho Shin, Sen Wu","cross_cats":["cs.CL","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-02-03T04:16:24Z","title":"Incremental Knowledge Base Construction Using DeepDive"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1502.00731","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2e8c7659ba832a8ecd0d1637fd6e4aa938430eee675edd91a7d222890fc84534","target":"record","created_at":"2026-05-18T01:48:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ab17b56c535a18b3491dd27756199acba6e1315ec707c5b6b2f73b8d39cfac0b","cross_cats_sorted":["cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2015-02-03T04:16:24Z","title_canon_sha256":"1c1875c47ddc9d41876914f64ef8e60ba309aa9d49df0061924308b529ab5916"},"schema_version":"1.0","source":{"id":"1502.00731","kind":"arxiv","version":4}},"canonical_sha256":"a48cffbac59f9fb4180511ed3e0d34b8f196b3aec5a584bb86845f08f31e69e0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a48cffbac59f9fb4180511ed3e0d34b8f196b3aec5a584bb86845f08f31e69e0","first_computed_at":"2026-05-18T01:48:06.402039Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:48:06.402039Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"27hGt5fX1/2vKU0tBQXFP6SeEKEfJk369WjFETpVoD/kYXRcfSY8RiIwV7tRQJLHVRXa869qXN6IA95F+7T3Dw==","signature_status":"signed_v1","signed_at":"2026-05-18T01:48:06.402653Z","signed_message":"canonical_sha256_bytes"},"source_id":"1502.00731","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2e8c7659ba832a8ecd0d1637fd6e4aa938430eee675edd91a7d222890fc84534","sha256:cdf07de78f29343025250b85d1b9ae709244e8d99faeb7b914e2e2ce7bafbb0f"],"state_sha256":"b38bac346ad15054f8eb9f92f187ddff4dc3a1c46f2ef3a738d5fe342ce5a479"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ND3MazMpaznzApKE7v1UWx5ne+vcQ0SEM1e2UhTMEP/MNZOtd2BBS9aWIXD9sLenhTOqxHzAL5MYfLPnBSSBBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T12:59:56.240967Z","bundle_sha256":"54a87798a525edcbfe862d1020097b012f79d8ec71d6acd678a6a32ff41a0b36"}}