{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:JRQ2M4F4OLLTM73HZNJUWM2V5G","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d9f8bddec30866d1fe3f554bf56b6e1840be6053464b100fd99e9da98ef24c99","cross_cats_sorted":["cs.DS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-08-04T07:26:20Z","title_canon_sha256":"44d2d5f2cf1f5ca9bca87d8f5fe25090506876105a6375b455ad7eaec455c288"},"schema_version":"1.0","source":{"id":"1708.01402","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.01402","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"arxiv_version","alias_value":"1708.01402v4","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.01402","created_at":"2026-05-18T00:24:42Z"},{"alias_kind":"pith_short_12","alias_value":"JRQ2M4F4OLLT","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_16","alias_value":"JRQ2M4F4OLLTM73H","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_8","alias_value":"JRQ2M4F4","created_at":"2026-05-18T12:31:24Z"}],"graph_snapshots":[{"event_id":"sha256:0940ad802e634f889545745ae74af4aa135ad9581d682000828dee51018203af","target":"graph","created_at":"2026-05-18T00:24:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Accurate and efficient record linkage is an open challenge of particular relevance to Australian Government Agencies, who recognise that so-called wicked social problems are best tackled by forming partnerships founded on large-scale data fusion. Names and addresses are the most common attributes on which data from different government agencies can be linked. In this paper, we focus on the problem of address linking. Linkage is particularly problematic when the data has significant quality issues. The most common approach for dealing with quality issues is to standardise raw data prior to link","authors_text":"Kee Siong Ng, Tania Churchill, Yuhang Zhang","cross_cats":["cs.DS"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-08-04T07:26:20Z","title":"Exploiting Redundancy, Recurrence and Parallelism: How to Link Millions of Addresses with Ten Lines of Code in Ten Minutes"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.01402","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:34e8e97a416143eb5a17aa0eb95311c7914e1dda0f995590620905e738406768","target":"record","created_at":"2026-05-18T00:24:42Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d9f8bddec30866d1fe3f554bf56b6e1840be6053464b100fd99e9da98ef24c99","cross_cats_sorted":["cs.DS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-08-04T07:26:20Z","title_canon_sha256":"44d2d5f2cf1f5ca9bca87d8f5fe25090506876105a6375b455ad7eaec455c288"},"schema_version":"1.0","source":{"id":"1708.01402","kind":"arxiv","version":4}},"canonical_sha256":"4c61a670bc72d7367f67cb534b3355e9b7e27bc9a70d3f4ec2acf686a76ddc23","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4c61a670bc72d7367f67cb534b3355e9b7e27bc9a70d3f4ec2acf686a76ddc23","first_computed_at":"2026-05-18T00:24:42.549687Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:24:42.549687Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"w06sng0TPvW61YTKYEcbl68VJoaXSYu3f+v9WWw9iXry82SDizDGIHYtXfd/h4xUrvu3zGfE/qkF1+5FvUt5DA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:24:42.550345Z","signed_message":"canonical_sha256_bytes"},"source_id":"1708.01402","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:34e8e97a416143eb5a17aa0eb95311c7914e1dda0f995590620905e738406768","sha256:0940ad802e634f889545745ae74af4aa135ad9581d682000828dee51018203af"],"state_sha256":"1cd174479da22516fd060dcc4aee84337957f3b52674e1a1d91df028f99fcc01"}