{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:QT3CKYHYEL4FKLQ4TFPB7IM3RF","short_pith_number":"pith:QT3CKYHY","canonical_record":{"source":{"id":"1810.04599","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-10-10T15:40:27Z","cross_cats_sorted":[],"title_canon_sha256":"f678aa6f156d9985d5b7b3e10787d33a04fc8503e93bad352c457e1bb6fc71f2","abstract_canon_sha256":"bad5eb17b78d72746aad4a688c20ea8ee2178af1cb8bc06b2ba576d6c8ea526b"},"schema_version":"1.0"},"canonical_sha256":"84f62560f822f8552e1c995e1fa19b895c80941f8ba81597f5f2270ed0bc611c","source":{"kind":"arxiv","id":"1810.04599","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.04599","created_at":"2026-05-18T00:03:14Z"},{"alias_kind":"arxiv_version","alias_value":"1810.04599v2","created_at":"2026-05-18T00:03:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.04599","created_at":"2026-05-18T00:03:14Z"},{"alias_kind":"pith_short_12","alias_value":"QT3CKYHYEL4F","created_at":"2026-05-18T12:32:46Z"},{"alias_kind":"pith_short_16","alias_value":"QT3CKYHYEL4FKLQ4","created_at":"2026-05-18T12:32:46Z"},{"alias_kind":"pith_short_8","alias_value":"QT3CKYHY","created_at":"2026-05-18T12:32:46Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:QT3CKYHYEL4FKLQ4TFPB7IM3RF","target":"record","payload":{"canonical_record":{"source":{"id":"1810.04599","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-10-10T15:40:27Z","cross_cats_sorted":[],"title_canon_sha256":"f678aa6f156d9985d5b7b3e10787d33a04fc8503e93bad352c457e1bb6fc71f2","abstract_canon_sha256":"bad5eb17b78d72746aad4a688c20ea8ee2178af1cb8bc06b2ba576d6c8ea526b"},"schema_version":"1.0"},"canonical_sha256":"84f62560f822f8552e1c995e1fa19b895c80941f8ba81597f5f2270ed0bc611c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:03:14.415442Z","signature_b64":"Jb7b8p1ENQvhqGKRXUqvQYDx/0Tjeh19PRND6xeMKxO/oRB74lrJNbKIrm/S0v2Rk9jbA8kU0r5xpJ0CUxEhAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"84f62560f822f8552e1c995e1fa19b895c80941f8ba81597f5f2270ed0bc611c","last_reissued_at":"2026-05-18T00:03:14.414964Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:03:14.414964Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1810.04599","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:03:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"zdc1art8oBCrydZE3TD/1lAJ8xUrVOG2mzMW6CddFTELZxDgqS1OrDA4OZDQbgYrgkVyUjjuPsnRK0PHUFUDDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T07:30:46.487977Z"},"content_sha256":"ca784febcb55936f96d0d8096cd88787389700836611fd8f548df9f8d338e8a2","schema_version":"1.0","event_id":"sha256:ca784febcb55936f96d0d8096cd88787389700836611fd8f548df9f8d338e8a2"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:QT3CKYHYEL4FKLQ4TFPB7IM3RF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Understanding Data Science Lifecycle Provenance via Graph Segmentation and Summarization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DB","authors_text":"Amol Deshpande, Hui Miao","submitted_at":"2018-10-10T15:40:27Z","abstract_excerpt":"Increasingly modern data science platforms today have non-intrusive and extensible provenance ingestion mechanisms to collect rich provenance and context information, handle modifications to the same file using distinguishable versions, and use graph data models (e.g., property graphs) and query languages (e.g., Cypher) to represent and manipulate the stored provenance/context information. Due to the schema-later nature of the metadata, multiple versions of the same files, and unfamiliar artifacts introduced by team members, the \"provenance graph\" is verbose and evolving, and hard to understan"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.04599","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:03:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"k51C5lhKSRyB9wErXaqwAszJhHCXEiyqZ5vF8JShwbofuQTjjZaLf0ruQ+9IimRidXpVqBCiMrzp95Om4l7CAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T07:30:46.488339Z"},"content_sha256":"3309ec1ec0a7cf27e3d39e021bed834b323486ce10340e61d98adec1f7d12822","schema_version":"1.0","event_id":"sha256:3309ec1ec0a7cf27e3d39e021bed834b323486ce10340e61d98adec1f7d12822"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/QT3CKYHYEL4FKLQ4TFPB7IM3RF/bundle.json","state_url":"https://pith.science/pith/QT3CKYHYEL4FKLQ4TFPB7IM3RF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/QT3CKYHYEL4FKLQ4TFPB7IM3RF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T07:30:46Z","links":{"resolver":"https://pith.science/pith/QT3CKYHYEL4FKLQ4TFPB7IM3RF","bundle":"https://pith.science/pith/QT3CKYHYEL4FKLQ4TFPB7IM3RF/bundle.json","state":"https://pith.science/pith/QT3CKYHYEL4FKLQ4TFPB7IM3RF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/QT3CKYHYEL4FKLQ4TFPB7IM3RF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:QT3CKYHYEL4FKLQ4TFPB7IM3RF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"bad5eb17b78d72746aad4a688c20ea8ee2178af1cb8bc06b2ba576d6c8ea526b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-10-10T15:40:27Z","title_canon_sha256":"f678aa6f156d9985d5b7b3e10787d33a04fc8503e93bad352c457e1bb6fc71f2"},"schema_version":"1.0","source":{"id":"1810.04599","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.04599","created_at":"2026-05-18T00:03:14Z"},{"alias_kind":"arxiv_version","alias_value":"1810.04599v2","created_at":"2026-05-18T00:03:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.04599","created_at":"2026-05-18T00:03:14Z"},{"alias_kind":"pith_short_12","alias_value":"QT3CKYHYEL4F","created_at":"2026-05-18T12:32:46Z"},{"alias_kind":"pith_short_16","alias_value":"QT3CKYHYEL4FKLQ4","created_at":"2026-05-18T12:32:46Z"},{"alias_kind":"pith_short_8","alias_value":"QT3CKYHY","created_at":"2026-05-18T12:32:46Z"}],"graph_snapshots":[{"event_id":"sha256:3309ec1ec0a7cf27e3d39e021bed834b323486ce10340e61d98adec1f7d12822","target":"graph","created_at":"2026-05-18T00:03:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Increasingly modern data science platforms today have non-intrusive and extensible provenance ingestion mechanisms to collect rich provenance and context information, handle modifications to the same file using distinguishable versions, and use graph data models (e.g., property graphs) and query languages (e.g., Cypher) to represent and manipulate the stored provenance/context information. Due to the schema-later nature of the metadata, multiple versions of the same files, and unfamiliar artifacts introduced by team members, the \"provenance graph\" is verbose and evolving, and hard to understan","authors_text":"Amol Deshpande, Hui Miao","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-10-10T15:40:27Z","title":"Understanding Data Science Lifecycle Provenance via Graph Segmentation and Summarization"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.04599","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ca784febcb55936f96d0d8096cd88787389700836611fd8f548df9f8d338e8a2","target":"record","created_at":"2026-05-18T00:03:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"bad5eb17b78d72746aad4a688c20ea8ee2178af1cb8bc06b2ba576d6c8ea526b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-10-10T15:40:27Z","title_canon_sha256":"f678aa6f156d9985d5b7b3e10787d33a04fc8503e93bad352c457e1bb6fc71f2"},"schema_version":"1.0","source":{"id":"1810.04599","kind":"arxiv","version":2}},"canonical_sha256":"84f62560f822f8552e1c995e1fa19b895c80941f8ba81597f5f2270ed0bc611c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"84f62560f822f8552e1c995e1fa19b895c80941f8ba81597f5f2270ed0bc611c","first_computed_at":"2026-05-18T00:03:14.414964Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:03:14.414964Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Jb7b8p1ENQvhqGKRXUqvQYDx/0Tjeh19PRND6xeMKxO/oRB74lrJNbKIrm/S0v2Rk9jbA8kU0r5xpJ0CUxEhAA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:03:14.415442Z","signed_message":"canonical_sha256_bytes"},"source_id":"1810.04599","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ca784febcb55936f96d0d8096cd88787389700836611fd8f548df9f8d338e8a2","sha256:3309ec1ec0a7cf27e3d39e021bed834b323486ce10340e61d98adec1f7d12822"],"state_sha256":"7882ce3a21a22e7db416a37b126a9354ef21273854a3d27f7bc9a29c0298ff13"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"79svTxB3yDywnN1A0TR9eV4kXrovxGn6iEAQazTlnR4TF2isQj4X+fTilVnj8ifYlyQtKCJd83VHIQOe5UdnBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T07:30:46.490236Z","bundle_sha256":"abed49b15d596e2b4f271eddc58c0e9d7f4769774a1c983806977b7175f0605d"}}