{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:GVUSPWDP55SGRPJUQJCUER72KJ","short_pith_number":"pith:GVUSPWDP","schema_version":"1.0","canonical_sha256":"356927d86fef6468bd3482454247fa52702bcb9cbcdf51a9e2e223f1fbf3ccd6","source":{"kind":"arxiv","id":"1805.08650","version":1},"attestation_state":"computed","paper":{"title":"Cache-based Multi-query Optimization for Data-intensive Scalable Computing Frameworks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DC"],"primary_cat":"cs.DB","authors_text":"Damiano Carra, Pietro Michiardi, Sara Migliorini","submitted_at":"2018-05-22T14:59:02Z","abstract_excerpt":"In modern large-scale distributed systems, analytics jobs submitted by various users often share similar work, for example scanning and processing the same subset of data. Instead of optimizing jobs independently, which may result in redundant and wasteful processing, multi-query optimization techniques can be employed to save a considerable amount of cluster resources. In this work, we introduce a novel method combining in-memory cache primitives and multi-query optimization, to improve the efficiency of data-intensive, scalable computing frameworks. By careful selection and exploitation of c"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1805.08650","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2018-05-22T14:59:02Z","cross_cats_sorted":["cs.DC"],"title_canon_sha256":"c6d8e16c96916aaf0139a1e56ce4950c8763694cf2f411451ca24d552025182e","abstract_canon_sha256":"68ba8c4f1c52523b6581573ba73421a9fd07cae63b866c32843e0579080207b2"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:15:25.555658Z","signature_b64":"6orS76b1oEZoLSdb6fLQU7xyw4wZBT8I8r5lB0osLu/OYmqdS3H46CfQx1o1IrFHhX/UuTBtlBTGC96sVlN5Bw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"356927d86fef6468bd3482454247fa52702bcb9cbcdf51a9e2e223f1fbf3ccd6","last_reissued_at":"2026-05-18T00:15:25.554923Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:15:25.554923Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Cache-based Multi-query Optimization for Data-intensive Scalable Computing Frameworks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DC"],"primary_cat":"cs.DB","authors_text":"Damiano Carra, Pietro Michiardi, Sara Migliorini","submitted_at":"2018-05-22T14:59:02Z","abstract_excerpt":"In modern large-scale distributed systems, analytics jobs submitted by various users often share similar work, for example scanning and processing the same subset of data. Instead of optimizing jobs independently, which may result in redundant and wasteful processing, multi-query optimization techniques can be employed to save a considerable amount of cluster resources. In this work, we introduce a novel method combining in-memory cache primitives and multi-query optimization, to improve the efficiency of data-intensive, scalable computing frameworks. By careful selection and exploitation of c"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.08650","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1805.08650","created_at":"2026-05-18T00:15:25.555052+00:00"},{"alias_kind":"arxiv_version","alias_value":"1805.08650v1","created_at":"2026-05-18T00:15:25.555052+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.08650","created_at":"2026-05-18T00:15:25.555052+00:00"},{"alias_kind":"pith_short_12","alias_value":"GVUSPWDP55SG","created_at":"2026-05-18T12:32:25.280505+00:00"},{"alias_kind":"pith_short_16","alias_value":"GVUSPWDP55SGRPJU","created_at":"2026-05-18T12:32:25.280505+00:00"},{"alias_kind":"pith_short_8","alias_value":"GVUSPWDP","created_at":"2026-05-18T12:32:25.280505+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ","json":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ.json","graph_json":"https://pith.science/api/pith-number/GVUSPWDP55SGRPJUQJCUER72KJ/graph.json","events_json":"https://pith.science/api/pith-number/GVUSPWDP55SGRPJUQJCUER72KJ/events.json","paper":"https://pith.science/paper/GVUSPWDP"},"agent_actions":{"view_html":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ","download_json":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ.json","view_paper":"https://pith.science/paper/GVUSPWDP","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1805.08650&json=true","fetch_graph":"https://pith.science/api/pith-number/GVUSPWDP55SGRPJUQJCUER72KJ/graph.json","fetch_events":"https://pith.science/api/pith-number/GVUSPWDP55SGRPJUQJCUER72KJ/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ/action/timestamp_anchor","attest_storage":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ/action/storage_attestation","attest_author":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ/action/author_attestation","sign_citation":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ/action/citation_signature","submit_replication":"https://pith.science/pith/GVUSPWDP55SGRPJUQJCUER72KJ/action/replication_record"}},"created_at":"2026-05-18T00:15:25.555052+00:00","updated_at":"2026-05-18T00:15:25.555052+00:00"}