{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2023:SYRUPKFAE4AZHGQUTELY2JADLP","short_pith_number":"pith:SYRUPKFA","canonical_record":{"source":{"id":"2307.00417","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2023-07-01T20:00:30Z","cross_cats_sorted":["cs.HC"],"title_canon_sha256":"7d39cd69ee2e935b21701e9f8714416ce5812412bc9f92c7a5fbbb6a03d640fd","abstract_canon_sha256":"12f6b529d20da1b3667ca43910585074f1e2ea5ef671b800e5baedcfed50536d"},"schema_version":"1.0"},"canonical_sha256":"962347a8a02701939a1499178d24035bc8827db891e78a204e34b7b5e36f4b8c","source":{"kind":"arxiv","id":"2307.00417","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2307.00417","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"arxiv_version","alias_value":"2307.00417v1","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2307.00417","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"pith_short_12","alias_value":"SYRUPKFAE4AZ","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"pith_short_16","alias_value":"SYRUPKFAE4AZHGQU","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"pith_short_8","alias_value":"SYRUPKFA","created_at":"2026-07-05T06:26:55Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2023:SYRUPKFAE4AZHGQUTELY2JADLP","target":"record","payload":{"canonical_record":{"source":{"id":"2307.00417","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2023-07-01T20:00:30Z","cross_cats_sorted":["cs.HC"],"title_canon_sha256":"7d39cd69ee2e935b21701e9f8714416ce5812412bc9f92c7a5fbbb6a03d640fd","abstract_canon_sha256":"12f6b529d20da1b3667ca43910585074f1e2ea5ef671b800e5baedcfed50536d"},"schema_version":"1.0"},"canonical_sha256":"962347a8a02701939a1499178d24035bc8827db891e78a204e34b7b5e36f4b8c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T06:26:55.908559Z","signature_b64":"NfbvqHyoT4TztJxbuj3hWNkJSbdZxIH/jBPTZ2lvHLf6MJi3PQuFL8Aioy8oZco1GXfSmElbFO2XymY6X7mHDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"962347a8a02701939a1499178d24035bc8827db891e78a204e34b7b5e36f4b8c","last_reissued_at":"2026-07-05T06:26:55.908051Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T06:26:55.908051Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2307.00417","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T06:26:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VCzRWFpSzrVy+oGC7cO6nFHWG2qUyGr0U2L7/Kc3H07mehH20mT6yG0bd1BtVKkzK+RI2nb5CxuA4oII5FuzCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T14:58:21.462373Z"},"content_sha256":"462095ac08607f60e8a09baff7dc5d366dfadde15a713a1024c6f4520e0310d7","schema_version":"1.0","event_id":"sha256:462095ac08607f60e8a09baff7dc5d366dfadde15a713a1024c6f4520e0310d7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2023:SYRUPKFAE4AZHGQUTELY2JADLP","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Aggregation Consistency Errors in Semantic Layers and How to Avoid Them","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.HC"],"primary_cat":"cs.DB","authors_text":"Eugene Wu, Pavan Kalyan Damalapati, Zezhou Huang","submitted_at":"2023-07-01T20:00:30Z","abstract_excerpt":"Analysts often struggle with analyzing data from multiple tables in a database due to their lack of knowledge on how to join and aggregate the data. To address this, data engineers pre-specify \"semantic layers\" which include the join conditions and \"metrics\" of interest with aggregation functions and expressions. However, joins can cause \"aggregation consistency issues\". For example, analysts may observe inflated total revenue caused by double counting from join fanouts. Existing BI tools rely on heuristics for deduplication, resulting in imprecise and challenging-to-understand outcomes. To ov"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2307.00417","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2307.00417/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T06:26:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P0DTwm6d4TMhE6gBCie8Gas5BpcT62B4c+l5v+SLn1+cMCuCGDf+toKoDdIbC1ADBZtjehMsuMI35+rQ+doqBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T14:58:21.462992Z"},"content_sha256":"b9f4e99719808bcc7415b51738cd767b2e04a4d3b3bd3b6a308fb3edc1040b52","schema_version":"1.0","event_id":"sha256:b9f4e99719808bcc7415b51738cd767b2e04a4d3b3bd3b6a308fb3edc1040b52"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SYRUPKFAE4AZHGQUTELY2JADLP/bundle.json","state_url":"https://pith.science/pith/SYRUPKFAE4AZHGQUTELY2JADLP/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SYRUPKFAE4AZHGQUTELY2JADLP/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T14:58:21Z","links":{"resolver":"https://pith.science/pith/SYRUPKFAE4AZHGQUTELY2JADLP","bundle":"https://pith.science/pith/SYRUPKFAE4AZHGQUTELY2JADLP/bundle.json","state":"https://pith.science/pith/SYRUPKFAE4AZHGQUTELY2JADLP/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SYRUPKFAE4AZHGQUTELY2JADLP/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2023:SYRUPKFAE4AZHGQUTELY2JADLP","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"12f6b529d20da1b3667ca43910585074f1e2ea5ef671b800e5baedcfed50536d","cross_cats_sorted":["cs.HC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2023-07-01T20:00:30Z","title_canon_sha256":"7d39cd69ee2e935b21701e9f8714416ce5812412bc9f92c7a5fbbb6a03d640fd"},"schema_version":"1.0","source":{"id":"2307.00417","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2307.00417","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"arxiv_version","alias_value":"2307.00417v1","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2307.00417","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"pith_short_12","alias_value":"SYRUPKFAE4AZ","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"pith_short_16","alias_value":"SYRUPKFAE4AZHGQU","created_at":"2026-07-05T06:26:55Z"},{"alias_kind":"pith_short_8","alias_value":"SYRUPKFA","created_at":"2026-07-05T06:26:55Z"}],"graph_snapshots":[{"event_id":"sha256:b9f4e99719808bcc7415b51738cd767b2e04a4d3b3bd3b6a308fb3edc1040b52","target":"graph","created_at":"2026-07-05T06:26:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2307.00417/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Analysts often struggle with analyzing data from multiple tables in a database due to their lack of knowledge on how to join and aggregate the data. To address this, data engineers pre-specify \"semantic layers\" which include the join conditions and \"metrics\" of interest with aggregation functions and expressions. However, joins can cause \"aggregation consistency issues\". For example, analysts may observe inflated total revenue caused by double counting from join fanouts. Existing BI tools rely on heuristics for deduplication, resulting in imprecise and challenging-to-understand outcomes. To ov","authors_text":"Eugene Wu, Pavan Kalyan Damalapati, Zezhou Huang","cross_cats":["cs.HC"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2023-07-01T20:00:30Z","title":"Aggregation Consistency Errors in Semantic Layers and How to Avoid Them"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2307.00417","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:462095ac08607f60e8a09baff7dc5d366dfadde15a713a1024c6f4520e0310d7","target":"record","created_at":"2026-07-05T06:26:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"12f6b529d20da1b3667ca43910585074f1e2ea5ef671b800e5baedcfed50536d","cross_cats_sorted":["cs.HC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2023-07-01T20:00:30Z","title_canon_sha256":"7d39cd69ee2e935b21701e9f8714416ce5812412bc9f92c7a5fbbb6a03d640fd"},"schema_version":"1.0","source":{"id":"2307.00417","kind":"arxiv","version":1}},"canonical_sha256":"962347a8a02701939a1499178d24035bc8827db891e78a204e34b7b5e36f4b8c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"962347a8a02701939a1499178d24035bc8827db891e78a204e34b7b5e36f4b8c","first_computed_at":"2026-07-05T06:26:55.908051Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T06:26:55.908051Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"NfbvqHyoT4TztJxbuj3hWNkJSbdZxIH/jBPTZ2lvHLf6MJi3PQuFL8Aioy8oZco1GXfSmElbFO2XymY6X7mHDg==","signature_status":"signed_v1","signed_at":"2026-07-05T06:26:55.908559Z","signed_message":"canonical_sha256_bytes"},"source_id":"2307.00417","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:462095ac08607f60e8a09baff7dc5d366dfadde15a713a1024c6f4520e0310d7","sha256:b9f4e99719808bcc7415b51738cd767b2e04a4d3b3bd3b6a308fb3edc1040b52"],"state_sha256":"c8f1d31b5d04e87937d46b72c84a1a48800b83acec8fc6e3765ca9bae30a53ca"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ukpYSrP1MUEEKLyHjG8Mzi6R7jAgKVHNDruwgTiuok3muQYMFKQBKDFyUvwBCZ7HhTRwiUAlTkwwFraU58l5DA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T14:58:21.466873Z","bundle_sha256":"da3362c6f46a306c0430b4741e8c993784acaedb6fcdf9d17b6a4386d9af8ee3"}}