{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:R2IDNGAPRXVP73HMRV5G2DTAW6","short_pith_number":"pith:R2IDNGAP","canonical_record":{"source":{"id":"1505.06807","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-05-26T05:12:23Z","cross_cats_sorted":["cs.DC","cs.MS","stat.ML"],"title_canon_sha256":"35d4fd1ac1a6b2bc862196b53fff858d9e2e72039dba7ad5634a02208c11b960","abstract_canon_sha256":"b8b1cbecfbc438fcaa3da5afbbc4a820651df31851682f1c8e8a00bb75b077d7"},"schema_version":"1.0"},"canonical_sha256":"8e9036980f8deaffecec8d7a6d0e60b7b6b02deea092edbc6e45f388c95adb65","source":{"kind":"arxiv","id":"1505.06807","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1505.06807","created_at":"2026-05-18T02:03:29Z"},{"alias_kind":"arxiv_version","alias_value":"1505.06807v1","created_at":"2026-05-18T02:03:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1505.06807","created_at":"2026-05-18T02:03:29Z"},{"alias_kind":"pith_short_12","alias_value":"R2IDNGAPRXVP","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_16","alias_value":"R2IDNGAPRXVP73HM","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_8","alias_value":"R2IDNGAP","created_at":"2026-05-18T12:29:39Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:R2IDNGAPRXVP73HMRV5G2DTAW6","target":"record","payload":{"canonical_record":{"source":{"id":"1505.06807","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-05-26T05:12:23Z","cross_cats_sorted":["cs.DC","cs.MS","stat.ML"],"title_canon_sha256":"35d4fd1ac1a6b2bc862196b53fff858d9e2e72039dba7ad5634a02208c11b960","abstract_canon_sha256":"b8b1cbecfbc438fcaa3da5afbbc4a820651df31851682f1c8e8a00bb75b077d7"},"schema_version":"1.0"},"canonical_sha256":"8e9036980f8deaffecec8d7a6d0e60b7b6b02deea092edbc6e45f388c95adb65","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:03:29.930047Z","signature_b64":"hNfMK0T/DEMNcLPM8tDPkNo8KvOU54SPFUwh/tAx6gtOUN8Ny3X/nXy0A5kSQJ0vCBaWdIRbhS93+p+CCSi5DA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8e9036980f8deaffecec8d7a6d0e60b7b6b02deea092edbc6e45f388c95adb65","last_reissued_at":"2026-05-18T02:03:29.929459Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:03:29.929459Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1505.06807","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:03:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jLbc9eOlZXN1NZ7TKhke1ZlbAxYH9HknCu+2rEEmkG0oqkCJVZHY5KzEP/0k6/gMgsx6GTwxZjF8G2faBo+lBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-19T19:00:38.554907Z"},"content_sha256":"db539994469907138d6f77a95be8c4172ad9f5a625971c8b24cc9ea19ad90bcd","schema_version":"1.0","event_id":"sha256:db539994469907138d6f77a95be8c4172ad9f5a625971c8b24cc9ea19ad90bcd"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:R2IDNGAPRXVP73HMRV5G2DTAW6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"MLlib: Machine Learning in Apache Spark","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DC","cs.MS","stat.ML"],"primary_cat":"cs.LG","authors_text":"Ameet Talwalkar, Burak Yavuz, Davies Liu, DB Tsai, Doris Xin, Evan Sparks, Jeremy Freeman, Joseph Bradley, Manish Amde, Matei Zaharia, Michael J. Franklin, Reynold Xin, Reza Zadeh, Sean Owen, Shivaram Venkataraman, Xiangrui Meng","submitted_at":"2015-05-26T05:12:23Z","abstract_excerpt":"Apache Spark is a popular open-source platform for large-scale data processing that is well-suited for iterative machine learning tasks. In this paper we present MLlib, Spark's open-source distributed machine learning library. MLlib provides efficient functionality for a wide range of learning settings and includes several underlying statistical, optimization, and linear algebra primitives. Shipped with Spark, MLlib supports several languages and provides a high-level API that leverages Spark's rich ecosystem to simplify the development of end-to-end machine learning pipelines. MLlib has exper"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1505.06807","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:03:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"t8R/6s9M+FYoPD76UHSPrsPx0y1PJJF/yH59sPMiRPaq2mUS3RPaXRyyL/TsZqnAlaN7RYTNcSrOAWBR0dwvCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-19T19:00:38.555263Z"},"content_sha256":"108d35701e425c97d5d680688dd80281458e1b44793e83afd68e3189e0500dd8","schema_version":"1.0","event_id":"sha256:108d35701e425c97d5d680688dd80281458e1b44793e83afd68e3189e0500dd8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/R2IDNGAPRXVP73HMRV5G2DTAW6/bundle.json","state_url":"https://pith.science/pith/R2IDNGAPRXVP73HMRV5G2DTAW6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/R2IDNGAPRXVP73HMRV5G2DTAW6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-19T19:00:38Z","links":{"resolver":"https://pith.science/pith/R2IDNGAPRXVP73HMRV5G2DTAW6","bundle":"https://pith.science/pith/R2IDNGAPRXVP73HMRV5G2DTAW6/bundle.json","state":"https://pith.science/pith/R2IDNGAPRXVP73HMRV5G2DTAW6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/R2IDNGAPRXVP73HMRV5G2DTAW6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:R2IDNGAPRXVP73HMRV5G2DTAW6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b8b1cbecfbc438fcaa3da5afbbc4a820651df31851682f1c8e8a00bb75b077d7","cross_cats_sorted":["cs.DC","cs.MS","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-05-26T05:12:23Z","title_canon_sha256":"35d4fd1ac1a6b2bc862196b53fff858d9e2e72039dba7ad5634a02208c11b960"},"schema_version":"1.0","source":{"id":"1505.06807","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1505.06807","created_at":"2026-05-18T02:03:29Z"},{"alias_kind":"arxiv_version","alias_value":"1505.06807v1","created_at":"2026-05-18T02:03:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1505.06807","created_at":"2026-05-18T02:03:29Z"},{"alias_kind":"pith_short_12","alias_value":"R2IDNGAPRXVP","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_16","alias_value":"R2IDNGAPRXVP73HM","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_8","alias_value":"R2IDNGAP","created_at":"2026-05-18T12:29:39Z"}],"graph_snapshots":[{"event_id":"sha256:108d35701e425c97d5d680688dd80281458e1b44793e83afd68e3189e0500dd8","target":"graph","created_at":"2026-05-18T02:03:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Apache Spark is a popular open-source platform for large-scale data processing that is well-suited for iterative machine learning tasks. In this paper we present MLlib, Spark's open-source distributed machine learning library. MLlib provides efficient functionality for a wide range of learning settings and includes several underlying statistical, optimization, and linear algebra primitives. Shipped with Spark, MLlib supports several languages and provides a high-level API that leverages Spark's rich ecosystem to simplify the development of end-to-end machine learning pipelines. MLlib has exper","authors_text":"Ameet Talwalkar, Burak Yavuz, Davies Liu, DB Tsai, Doris Xin, Evan Sparks, Jeremy Freeman, Joseph Bradley, Manish Amde, Matei Zaharia, Michael J. Franklin, Reynold Xin, Reza Zadeh, Sean Owen, Shivaram Venkataraman, Xiangrui Meng","cross_cats":["cs.DC","cs.MS","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-05-26T05:12:23Z","title":"MLlib: Machine Learning in Apache Spark"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1505.06807","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:db539994469907138d6f77a95be8c4172ad9f5a625971c8b24cc9ea19ad90bcd","target":"record","created_at":"2026-05-18T02:03:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b8b1cbecfbc438fcaa3da5afbbc4a820651df31851682f1c8e8a00bb75b077d7","cross_cats_sorted":["cs.DC","cs.MS","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2015-05-26T05:12:23Z","title_canon_sha256":"35d4fd1ac1a6b2bc862196b53fff858d9e2e72039dba7ad5634a02208c11b960"},"schema_version":"1.0","source":{"id":"1505.06807","kind":"arxiv","version":1}},"canonical_sha256":"8e9036980f8deaffecec8d7a6d0e60b7b6b02deea092edbc6e45f388c95adb65","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8e9036980f8deaffecec8d7a6d0e60b7b6b02deea092edbc6e45f388c95adb65","first_computed_at":"2026-05-18T02:03:29.929459Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:03:29.929459Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"hNfMK0T/DEMNcLPM8tDPkNo8KvOU54SPFUwh/tAx6gtOUN8Ny3X/nXy0A5kSQJ0vCBaWdIRbhS93+p+CCSi5DA==","signature_status":"signed_v1","signed_at":"2026-05-18T02:03:29.930047Z","signed_message":"canonical_sha256_bytes"},"source_id":"1505.06807","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:db539994469907138d6f77a95be8c4172ad9f5a625971c8b24cc9ea19ad90bcd","sha256:108d35701e425c97d5d680688dd80281458e1b44793e83afd68e3189e0500dd8"],"state_sha256":"1b35d17a350bd4f408afbf650d862f728e22c5bfa5c784c24780463586cbdad7"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/Pm5FOZlfnhxPj834zamNq7kiY8fLQzsLQUs3AWM3AlbxWxydI7sZWIyK87dviC4w4D0l12i548FPj1g0oa7DQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-19T19:00:38.557395Z","bundle_sha256":"7af7010f55cd16e5bad221eddcc21dcc451d23d93e722b21d482fab4bc4ea433"}}