{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2011:PO6EZICZ732ZXBGUZMJJYAHQPW","short_pith_number":"pith:PO6EZICZ","canonical_record":{"source":{"id":"1107.1697","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.CO","submitted_at":"2011-07-08T18:50:16Z","cross_cats_sorted":["cs.DS"],"title_canon_sha256":"c77a5737abf60a267296eeebc28eb9df9cb8021d6d1506c4d870027ce49f1525","abstract_canon_sha256":"5253c2f2348d28de06fe8274238ffe7d97d82243a02b2979ea9d4e1b49c147d6"},"schema_version":"1.0"},"canonical_sha256":"7bbc4ca059fef59b84d4cb129c00f07db86e385d8109f35e273afa357c4ae858","source":{"kind":"arxiv","id":"1107.1697","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1107.1697","created_at":"2026-05-18T02:21:43Z"},{"alias_kind":"arxiv_version","alias_value":"1107.1697v1","created_at":"2026-05-18T02:21:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1107.1697","created_at":"2026-05-18T02:21:43Z"},{"alias_kind":"pith_short_12","alias_value":"PO6EZICZ732Z","created_at":"2026-05-18T12:26:39Z"},{"alias_kind":"pith_short_16","alias_value":"PO6EZICZ732ZXBGU","created_at":"2026-05-18T12:26:39Z"},{"alias_kind":"pith_short_8","alias_value":"PO6EZICZ","created_at":"2026-05-18T12:26:39Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2011:PO6EZICZ732ZXBGUZMJJYAHQPW","target":"record","payload":{"canonical_record":{"source":{"id":"1107.1697","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.CO","submitted_at":"2011-07-08T18:50:16Z","cross_cats_sorted":["cs.DS"],"title_canon_sha256":"c77a5737abf60a267296eeebc28eb9df9cb8021d6d1506c4d870027ce49f1525","abstract_canon_sha256":"5253c2f2348d28de06fe8274238ffe7d97d82243a02b2979ea9d4e1b49c147d6"},"schema_version":"1.0"},"canonical_sha256":"7bbc4ca059fef59b84d4cb129c00f07db86e385d8109f35e273afa357c4ae858","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:21:43.166788Z","signature_b64":"fOqLWi0JaPCZh+3Du4yuvqLuBpPxYQ7tusBLtMtR/wNvLjUkXQZ/P34xMIIByASJLf7LhMtV5l7a5ncpGDTMCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7bbc4ca059fef59b84d4cb129c00f07db86e385d8109f35e273afa357c4ae858","last_reissued_at":"2026-05-18T02:21:43.166396Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:21:43.166396Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1107.1697","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:21:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"HzVMHXk7u4eELoVdnuWv1eInb5yizsd2e41sIeoqjyIMVRaPMhkY+JG5la7AISR3DH0QyovDhi6EiLSTIFMVBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T16:38:09.114213Z"},"content_sha256":"adc2fbc8b1f4a2f2442ccf0bd3eeb3786ef569bb87d024f724bd3f4a4d4bc756","schema_version":"1.0","event_id":"sha256:adc2fbc8b1f4a2f2442ccf0bd3eeb3786ef569bb87d024f724bd3f4a4d4bc756"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2011:PO6EZICZ732ZXBGUZMJJYAHQPW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Distinct counting with a self-learning bitmap","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DS"],"primary_cat":"stat.CO","authors_text":"Aiyou Chen, Jin Cao, Larry Shepp, Tuan Nguyen","submitted_at":"2011-07-08T18:50:16Z","abstract_excerpt":"Counting the number of distinct elements (cardinality) in a dataset is a fundamental problem in database management. In recent years, due to many of its modern applications, there has been significant interest to address the distinct counting problem in a data stream setting, where each incoming data can be seen only once and cannot be stored for long periods of time. Many probabilistic approaches based on either sampling or sketching have been proposed in the computer science literature, that only require limited computing and memory resources. However, the performances of these methods are n"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1107.1697","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:21:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kfABf4pfyHQ+w4JC3FS/XCgdFD5K7IewT7dlN1I98QfbfTHwsjG2Z3vrKsVMfIhQDkibLIYJgkRjfQG5qvFKAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T16:38:09.114734Z"},"content_sha256":"ebd2d4f33f0e9860d16768feb6c1248f9bedf92cc04b574d14c97c2487f15db9","schema_version":"1.0","event_id":"sha256:ebd2d4f33f0e9860d16768feb6c1248f9bedf92cc04b574d14c97c2487f15db9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/PO6EZICZ732ZXBGUZMJJYAHQPW/bundle.json","state_url":"https://pith.science/pith/PO6EZICZ732ZXBGUZMJJYAHQPW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/PO6EZICZ732ZXBGUZMJJYAHQPW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T16:38:09Z","links":{"resolver":"https://pith.science/pith/PO6EZICZ732ZXBGUZMJJYAHQPW","bundle":"https://pith.science/pith/PO6EZICZ732ZXBGUZMJJYAHQPW/bundle.json","state":"https://pith.science/pith/PO6EZICZ732ZXBGUZMJJYAHQPW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/PO6EZICZ732ZXBGUZMJJYAHQPW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2011:PO6EZICZ732ZXBGUZMJJYAHQPW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5253c2f2348d28de06fe8274238ffe7d97d82243a02b2979ea9d4e1b49c147d6","cross_cats_sorted":["cs.DS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.CO","submitted_at":"2011-07-08T18:50:16Z","title_canon_sha256":"c77a5737abf60a267296eeebc28eb9df9cb8021d6d1506c4d870027ce49f1525"},"schema_version":"1.0","source":{"id":"1107.1697","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1107.1697","created_at":"2026-05-18T02:21:43Z"},{"alias_kind":"arxiv_version","alias_value":"1107.1697v1","created_at":"2026-05-18T02:21:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1107.1697","created_at":"2026-05-18T02:21:43Z"},{"alias_kind":"pith_short_12","alias_value":"PO6EZICZ732Z","created_at":"2026-05-18T12:26:39Z"},{"alias_kind":"pith_short_16","alias_value":"PO6EZICZ732ZXBGU","created_at":"2026-05-18T12:26:39Z"},{"alias_kind":"pith_short_8","alias_value":"PO6EZICZ","created_at":"2026-05-18T12:26:39Z"}],"graph_snapshots":[{"event_id":"sha256:ebd2d4f33f0e9860d16768feb6c1248f9bedf92cc04b574d14c97c2487f15db9","target":"graph","created_at":"2026-05-18T02:21:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Counting the number of distinct elements (cardinality) in a dataset is a fundamental problem in database management. In recent years, due to many of its modern applications, there has been significant interest to address the distinct counting problem in a data stream setting, where each incoming data can be seen only once and cannot be stored for long periods of time. Many probabilistic approaches based on either sampling or sketching have been proposed in the computer science literature, that only require limited computing and memory resources. However, the performances of these methods are n","authors_text":"Aiyou Chen, Jin Cao, Larry Shepp, Tuan Nguyen","cross_cats":["cs.DS"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.CO","submitted_at":"2011-07-08T18:50:16Z","title":"Distinct counting with a self-learning bitmap"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1107.1697","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:adc2fbc8b1f4a2f2442ccf0bd3eeb3786ef569bb87d024f724bd3f4a4d4bc756","target":"record","created_at":"2026-05-18T02:21:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5253c2f2348d28de06fe8274238ffe7d97d82243a02b2979ea9d4e1b49c147d6","cross_cats_sorted":["cs.DS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.CO","submitted_at":"2011-07-08T18:50:16Z","title_canon_sha256":"c77a5737abf60a267296eeebc28eb9df9cb8021d6d1506c4d870027ce49f1525"},"schema_version":"1.0","source":{"id":"1107.1697","kind":"arxiv","version":1}},"canonical_sha256":"7bbc4ca059fef59b84d4cb129c00f07db86e385d8109f35e273afa357c4ae858","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7bbc4ca059fef59b84d4cb129c00f07db86e385d8109f35e273afa357c4ae858","first_computed_at":"2026-05-18T02:21:43.166396Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:21:43.166396Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"fOqLWi0JaPCZh+3Du4yuvqLuBpPxYQ7tusBLtMtR/wNvLjUkXQZ/P34xMIIByASJLf7LhMtV5l7a5ncpGDTMCQ==","signature_status":"signed_v1","signed_at":"2026-05-18T02:21:43.166788Z","signed_message":"canonical_sha256_bytes"},"source_id":"1107.1697","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:adc2fbc8b1f4a2f2442ccf0bd3eeb3786ef569bb87d024f724bd3f4a4d4bc756","sha256:ebd2d4f33f0e9860d16768feb6c1248f9bedf92cc04b574d14c97c2487f15db9"],"state_sha256":"ada4256e826e90cdeb978696b5d82581fb503d2b379c98c2aeb394c0c1048dda"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5xZyzBsIgJ3+a4eSPSYYTVRDMshcI8mE6H02CZwq9ImvPT8O/HKC0gTX3aSnc/sRKz9MJwN+R32Dlv7PXwMfCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T16:38:09.117994Z","bundle_sha256":"d6bb219a3449966a5c32cf87f7a210675c162df992e53d25bca58e0616cbd9f4"}}