{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:KJZNAAO3NAL337DZWXD6UXIKKU","short_pith_number":"pith:KJZNAAO3","canonical_record":{"source":{"id":"1510.05041","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2015-10-16T22:34:24Z","cross_cats_sorted":[],"title_canon_sha256":"4dc35a81e5c4cc558369b861ef6585a62a26520ce70baf4568718eebcadbb609","abstract_canon_sha256":"212850317d2311a062cb0b52190580ee7aa3068d2aa707ca8fa3f543e112a2c7"},"schema_version":"1.0"},"canonical_sha256":"5272d001db6817bdfc79b5c7ea5d0a5510c6f1fbad729ca7f74e7730d2fac918","source":{"kind":"arxiv","id":"1510.05041","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1510.05041","created_at":"2026-05-18T01:29:53Z"},{"alias_kind":"arxiv_version","alias_value":"1510.05041v1","created_at":"2026-05-18T01:29:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1510.05041","created_at":"2026-05-18T01:29:53Z"},{"alias_kind":"pith_short_12","alias_value":"KJZNAAO3NAL3","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_16","alias_value":"KJZNAAO3NAL337DZ","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_8","alias_value":"KJZNAAO3","created_at":"2026-05-18T12:29:29Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:KJZNAAO3NAL337DZWXD6UXIKKU","target":"record","payload":{"canonical_record":{"source":{"id":"1510.05041","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2015-10-16T22:34:24Z","cross_cats_sorted":[],"title_canon_sha256":"4dc35a81e5c4cc558369b861ef6585a62a26520ce70baf4568718eebcadbb609","abstract_canon_sha256":"212850317d2311a062cb0b52190580ee7aa3068d2aa707ca8fa3f543e112a2c7"},"schema_version":"1.0"},"canonical_sha256":"5272d001db6817bdfc79b5c7ea5d0a5510c6f1fbad729ca7f74e7730d2fac918","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:29:53.345572Z","signature_b64":"5bbYiEqebUcxblw1TiERo+OHf/ybDNx5E3s8MY9GtMqmzJT4VjwQ2lM7pUhIk9kwymoSjsWxXGPN1zwZI8LkCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5272d001db6817bdfc79b5c7ea5d0a5510c6f1fbad729ca7f74e7730d2fac918","last_reissued_at":"2026-05-18T01:29:53.344977Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:29:53.344977Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1510.05041","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:29:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+F440DBdmGr1M+0lqZ/BYkWSLHxI4ypMlMWWJCAwbrh1t7C+z160nHq4A1s7lFPkj4MReEGFSQHe6UES+NjRBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T21:48:19.770213Z"},"content_sha256":"5b36359767c3917fd31e5bde73641810f728058773343e6bac5531c6e04812e1","schema_version":"1.0","event_id":"sha256:5b36359767c3917fd31e5bde73641810f728058773343e6bac5531c6e04812e1"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:KJZNAAO3NAL337DZWXD6UXIKKU","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"BLASX: A High Performance Level-3 BLAS Library for Heterogeneous Multi-GPU Computing","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Jianxiong Xiao, Linnan Wang, Wei Wu, Yi Yang","submitted_at":"2015-10-16T22:34:24Z","abstract_excerpt":"Basic Linear Algebra Subprograms (BLAS) are a set of low level linear algebra kernels widely adopted by applications involved with the deep learning and scientific computing. The massive and economic computing power brought forth by the emerging GPU architectures drives interest in implementation of compute-intensive level 3 BLAS on multi-GPU systems. In this paper, we investigate existing multi-GPU level 3 BLAS and present that 1) issues, such as the improper load balancing, inefficient communication, insufficient GPU stream level concurrency and data caching, impede current implementations f"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1510.05041","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:29:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Gp4fLrX3jKMZOaqC1q6An3V4SUvqdOCknHdNzwI6JnoAAcY6QINr13+NHq1jPiyVPflgqblJOR/W7bid28jgBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T21:48:19.770573Z"},"content_sha256":"d726273cd0f18b57dd468a6d42965b3dd3cca32f3de86891b912176e2a89428d","schema_version":"1.0","event_id":"sha256:d726273cd0f18b57dd468a6d42965b3dd3cca32f3de86891b912176e2a89428d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/bundle.json","state_url":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/KJZNAAO3NAL337DZWXD6UXIKKU/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T21:48:19Z","links":{"resolver":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU","bundle":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/bundle.json","state":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/state.json","well_known_bundle":"https://pith.science/.well-known/pith/KJZNAAO3NAL337DZWXD6UXIKKU/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:KJZNAAO3NAL337DZWXD6UXIKKU","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"212850317d2311a062cb0b52190580ee7aa3068d2aa707ca8fa3f543e112a2c7","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2015-10-16T22:34:24Z","title_canon_sha256":"4dc35a81e5c4cc558369b861ef6585a62a26520ce70baf4568718eebcadbb609"},"schema_version":"1.0","source":{"id":"1510.05041","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1510.05041","created_at":"2026-05-18T01:29:53Z"},{"alias_kind":"arxiv_version","alias_value":"1510.05041v1","created_at":"2026-05-18T01:29:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1510.05041","created_at":"2026-05-18T01:29:53Z"},{"alias_kind":"pith_short_12","alias_value":"KJZNAAO3NAL3","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_16","alias_value":"KJZNAAO3NAL337DZ","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_8","alias_value":"KJZNAAO3","created_at":"2026-05-18T12:29:29Z"}],"graph_snapshots":[{"event_id":"sha256:d726273cd0f18b57dd468a6d42965b3dd3cca32f3de86891b912176e2a89428d","target":"graph","created_at":"2026-05-18T01:29:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Basic Linear Algebra Subprograms (BLAS) are a set of low level linear algebra kernels widely adopted by applications involved with the deep learning and scientific computing. The massive and economic computing power brought forth by the emerging GPU architectures drives interest in implementation of compute-intensive level 3 BLAS on multi-GPU systems. In this paper, we investigate existing multi-GPU level 3 BLAS and present that 1) issues, such as the improper load balancing, inefficient communication, insufficient GPU stream level concurrency and data caching, impede current implementations f","authors_text":"Jianxiong Xiao, Linnan Wang, Wei Wu, Yi Yang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2015-10-16T22:34:24Z","title":"BLASX: A High Performance Level-3 BLAS Library for Heterogeneous Multi-GPU Computing"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1510.05041","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5b36359767c3917fd31e5bde73641810f728058773343e6bac5531c6e04812e1","target":"record","created_at":"2026-05-18T01:29:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"212850317d2311a062cb0b52190580ee7aa3068d2aa707ca8fa3f543e112a2c7","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2015-10-16T22:34:24Z","title_canon_sha256":"4dc35a81e5c4cc558369b861ef6585a62a26520ce70baf4568718eebcadbb609"},"schema_version":"1.0","source":{"id":"1510.05041","kind":"arxiv","version":1}},"canonical_sha256":"5272d001db6817bdfc79b5c7ea5d0a5510c6f1fbad729ca7f74e7730d2fac918","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5272d001db6817bdfc79b5c7ea5d0a5510c6f1fbad729ca7f74e7730d2fac918","first_computed_at":"2026-05-18T01:29:53.344977Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:29:53.344977Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"5bbYiEqebUcxblw1TiERo+OHf/ybDNx5E3s8MY9GtMqmzJT4VjwQ2lM7pUhIk9kwymoSjsWxXGPN1zwZI8LkCQ==","signature_status":"signed_v1","signed_at":"2026-05-18T01:29:53.345572Z","signed_message":"canonical_sha256_bytes"},"source_id":"1510.05041","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5b36359767c3917fd31e5bde73641810f728058773343e6bac5531c6e04812e1","sha256:d726273cd0f18b57dd468a6d42965b3dd3cca32f3de86891b912176e2a89428d"],"state_sha256":"6d06c941aa57e0648c77d32b843284535e5700a83eeccf77852c6d9adb6dd67f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+MWyPwgWLcSrUbqGWZxh+xOZEVngfOlYrx+qSgxKR5Pvu7APGmFIpcFUaBf1u0dbYVl/RIoCbo0xOKAi83XSBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T21:48:19.772560Z","bundle_sha256":"4898d5621a2dad2011dbafcf48cb22636bed7347a13495aac86b43e76945cbd7"}}