{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:ED3G5PXPM6YSSVDYRKVTVL2XAH","short_pith_number":"pith:ED3G5PXP","canonical_record":{"source":{"id":"1907.01183","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2019-07-02T05:58:18Z","cross_cats_sorted":["cs.DB"],"title_canon_sha256":"1ef0e9f655272e9544658fa2e87a3487719a7f83b468c6387876eaa07a5f3e00","abstract_canon_sha256":"6020135805bf5e1c6d9dc3a7022a315471a7d63391115091004c9df2945d444f"},"schema_version":"1.0"},"canonical_sha256":"20f66ebeef67b12954788aab3aaf5701fdf2bbe06562404f6dca7073aa0808fb","source":{"kind":"arxiv","id":"1907.01183","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.01183","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"arxiv_version","alias_value":"1907.01183v1","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.01183","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"pith_short_12","alias_value":"ED3G5PXPM6YS","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_16","alias_value":"ED3G5PXPM6YSSVDY","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_8","alias_value":"ED3G5PXP","created_at":"2026-05-18T12:33:15Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:ED3G5PXPM6YSSVDYRKVTVL2XAH","target":"record","payload":{"canonical_record":{"source":{"id":"1907.01183","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2019-07-02T05:58:18Z","cross_cats_sorted":["cs.DB"],"title_canon_sha256":"1ef0e9f655272e9544658fa2e87a3487719a7f83b468c6387876eaa07a5f3e00","abstract_canon_sha256":"6020135805bf5e1c6d9dc3a7022a315471a7d63391115091004c9df2945d444f"},"schema_version":"1.0"},"canonical_sha256":"20f66ebeef67b12954788aab3aaf5701fdf2bbe06562404f6dca7073aa0808fb","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:41.047667Z","signature_b64":"NfFNbZNNApyUbpvDF++9dZLfDje9jdJ09EaY0ucm3l4FrflD09kN0RPbry+gI0ElqLx2iQprADG9L1Kt56tuDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"20f66ebeef67b12954788aab3aaf5701fdf2bbe06562404f6dca7073aa0808fb","last_reissued_at":"2026-05-17T23:41:41.047115Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:41.047115Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1907.01183","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Awej8Pkkly2iMY6OgjTVsFbOU1hiOyOzf1A+NuOAqqakDfV/phW7v/wjgyCyQQ2ZkiZaQxRfvqZBhMO3fqs/Bw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T00:35:46.140905Z"},"content_sha256":"a7ac013d3523a0d14d2e7b3490b965619c7de52d05814b75da472586251e767d","schema_version":"1.0","event_id":"sha256:a7ac013d3523a0d14d2e7b3490b965619c7de52d05814b75da472586251e767d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:ED3G5PXPM6YSSVDYRKVTVL2XAH","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Framework for Evaluating Snippet Generation for Dataset Search","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.DB"],"primary_cat":"cs.IR","authors_text":"Evgeny Kharlamov, Gong Cheng, Jeff Z. Pan, Jinchi Chen, Shuxin Li, Xiaxia Wang, Yuzhong Qu","submitted_at":"2019-07-02T05:58:18Z","abstract_excerpt":"Reusing existing datasets is of considerable significance to researchers and developers. Dataset search engines help a user find relevant datasets for reuse. They can present a snippet for each retrieved dataset to explain its relevance to the user's data needs. This emerging problem of snippet generation for dataset search has not received much research attention. To provide a basis for future research, we introduce a framework for quantitatively evaluating the quality of a dataset snippet. The proposed metrics assess the extent to which a snippet matches the query intent and covers the main "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.01183","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BB0oCtBuvdqreI3k5KH3dA90ZqxtkHbRGkNblEjHSzOWCfrl2d5Ek2eDaxVazzwzah6N01a2AKGaKLNEMmfIDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T00:35:46.141265Z"},"content_sha256":"c9edad8b982c00b41ebd8a6eba2b4a1168572dfd07a8abb456fdc395c6a31b58","schema_version":"1.0","event_id":"sha256:c9edad8b982c00b41ebd8a6eba2b4a1168572dfd07a8abb456fdc395c6a31b58"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ED3G5PXPM6YSSVDYRKVTVL2XAH/bundle.json","state_url":"https://pith.science/pith/ED3G5PXPM6YSSVDYRKVTVL2XAH/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ED3G5PXPM6YSSVDYRKVTVL2XAH/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T00:35:46Z","links":{"resolver":"https://pith.science/pith/ED3G5PXPM6YSSVDYRKVTVL2XAH","bundle":"https://pith.science/pith/ED3G5PXPM6YSSVDYRKVTVL2XAH/bundle.json","state":"https://pith.science/pith/ED3G5PXPM6YSSVDYRKVTVL2XAH/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ED3G5PXPM6YSSVDYRKVTVL2XAH/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:ED3G5PXPM6YSSVDYRKVTVL2XAH","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6020135805bf5e1c6d9dc3a7022a315471a7d63391115091004c9df2945d444f","cross_cats_sorted":["cs.DB"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2019-07-02T05:58:18Z","title_canon_sha256":"1ef0e9f655272e9544658fa2e87a3487719a7f83b468c6387876eaa07a5f3e00"},"schema_version":"1.0","source":{"id":"1907.01183","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.01183","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"arxiv_version","alias_value":"1907.01183v1","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.01183","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"pith_short_12","alias_value":"ED3G5PXPM6YS","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_16","alias_value":"ED3G5PXPM6YSSVDY","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_8","alias_value":"ED3G5PXP","created_at":"2026-05-18T12:33:15Z"}],"graph_snapshots":[{"event_id":"sha256:c9edad8b982c00b41ebd8a6eba2b4a1168572dfd07a8abb456fdc395c6a31b58","target":"graph","created_at":"2026-05-17T23:41:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Reusing existing datasets is of considerable significance to researchers and developers. Dataset search engines help a user find relevant datasets for reuse. They can present a snippet for each retrieved dataset to explain its relevance to the user's data needs. This emerging problem of snippet generation for dataset search has not received much research attention. To provide a basis for future research, we introduce a framework for quantitatively evaluating the quality of a dataset snippet. The proposed metrics assess the extent to which a snippet matches the query intent and covers the main ","authors_text":"Evgeny Kharlamov, Gong Cheng, Jeff Z. Pan, Jinchi Chen, Shuxin Li, Xiaxia Wang, Yuzhong Qu","cross_cats":["cs.DB"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2019-07-02T05:58:18Z","title":"A Framework for Evaluating Snippet Generation for Dataset Search"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.01183","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a7ac013d3523a0d14d2e7b3490b965619c7de52d05814b75da472586251e767d","target":"record","created_at":"2026-05-17T23:41:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6020135805bf5e1c6d9dc3a7022a315471a7d63391115091004c9df2945d444f","cross_cats_sorted":["cs.DB"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2019-07-02T05:58:18Z","title_canon_sha256":"1ef0e9f655272e9544658fa2e87a3487719a7f83b468c6387876eaa07a5f3e00"},"schema_version":"1.0","source":{"id":"1907.01183","kind":"arxiv","version":1}},"canonical_sha256":"20f66ebeef67b12954788aab3aaf5701fdf2bbe06562404f6dca7073aa0808fb","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"20f66ebeef67b12954788aab3aaf5701fdf2bbe06562404f6dca7073aa0808fb","first_computed_at":"2026-05-17T23:41:41.047115Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:41.047115Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"NfFNbZNNApyUbpvDF++9dZLfDje9jdJ09EaY0ucm3l4FrflD09kN0RPbry+gI0ElqLx2iQprADG9L1Kt56tuDA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:41.047667Z","signed_message":"canonical_sha256_bytes"},"source_id":"1907.01183","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a7ac013d3523a0d14d2e7b3490b965619c7de52d05814b75da472586251e767d","sha256:c9edad8b982c00b41ebd8a6eba2b4a1168572dfd07a8abb456fdc395c6a31b58"],"state_sha256":"c1a995fc8abb744abd0267242dac0f1557481e25b043530606568735c8efc0dc"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Y9YJioufuDVOnAi0TEFcywC5EwxtjE6r4gzCfFWZhA3ldC0fM1rS08de5pN/cwzcHCikshP4r3XvbFpfqOSLBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T00:35:46.143706Z","bundle_sha256":"11b183a2781ba9684bc63a0962abde15f661e3ce51fe44b2bb88c8903d57b48c"}}