{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2015:KJZNAAO3NAL337DZWXD6UXIKKU","short_pith_number":"pith:KJZNAAO3","schema_version":"1.0","canonical_sha256":"5272d001db6817bdfc79b5c7ea5d0a5510c6f1fbad729ca7f74e7730d2fac918","source":{"kind":"arxiv","id":"1510.05041","version":1},"attestation_state":"computed","paper":{"title":"BLASX: A High Performance Level-3 BLAS Library for Heterogeneous Multi-GPU Computing","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Jianxiong Xiao, Linnan Wang, Wei Wu, Yi Yang","submitted_at":"2015-10-16T22:34:24Z","abstract_excerpt":"Basic Linear Algebra Subprograms (BLAS) are a set of low level linear algebra kernels widely adopted by applications involved with the deep learning and scientific computing. The massive and economic computing power brought forth by the emerging GPU architectures drives interest in implementation of compute-intensive level 3 BLAS on multi-GPU systems. In this paper, we investigate existing multi-GPU level 3 BLAS and present that 1) issues, such as the improper load balancing, inefficient communication, insufficient GPU stream level concurrency and data caching, impede current implementations f"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1510.05041","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2015-10-16T22:34:24Z","cross_cats_sorted":[],"title_canon_sha256":"4dc35a81e5c4cc558369b861ef6585a62a26520ce70baf4568718eebcadbb609","abstract_canon_sha256":"212850317d2311a062cb0b52190580ee7aa3068d2aa707ca8fa3f543e112a2c7"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:29:53.345572Z","signature_b64":"5bbYiEqebUcxblw1TiERo+OHf/ybDNx5E3s8MY9GtMqmzJT4VjwQ2lM7pUhIk9kwymoSjsWxXGPN1zwZI8LkCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5272d001db6817bdfc79b5c7ea5d0a5510c6f1fbad729ca7f74e7730d2fac918","last_reissued_at":"2026-05-18T01:29:53.344977Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:29:53.344977Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"BLASX: A High Performance Level-3 BLAS Library for Heterogeneous Multi-GPU Computing","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Jianxiong Xiao, Linnan Wang, Wei Wu, Yi Yang","submitted_at":"2015-10-16T22:34:24Z","abstract_excerpt":"Basic Linear Algebra Subprograms (BLAS) are a set of low level linear algebra kernels widely adopted by applications involved with the deep learning and scientific computing. The massive and economic computing power brought forth by the emerging GPU architectures drives interest in implementation of compute-intensive level 3 BLAS on multi-GPU systems. In this paper, we investigate existing multi-GPU level 3 BLAS and present that 1) issues, such as the improper load balancing, inefficient communication, insufficient GPU stream level concurrency and data caching, impede current implementations f"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1510.05041","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1510.05041","created_at":"2026-05-18T01:29:53.345063+00:00"},{"alias_kind":"arxiv_version","alias_value":"1510.05041v1","created_at":"2026-05-18T01:29:53.345063+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1510.05041","created_at":"2026-05-18T01:29:53.345063+00:00"},{"alias_kind":"pith_short_12","alias_value":"KJZNAAO3NAL3","created_at":"2026-05-18T12:29:29.992203+00:00"},{"alias_kind":"pith_short_16","alias_value":"KJZNAAO3NAL337DZ","created_at":"2026-05-18T12:29:29.992203+00:00"},{"alias_kind":"pith_short_8","alias_value":"KJZNAAO3","created_at":"2026-05-18T12:29:29.992203+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU","json":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU.json","graph_json":"https://pith.science/api/pith-number/KJZNAAO3NAL337DZWXD6UXIKKU/graph.json","events_json":"https://pith.science/api/pith-number/KJZNAAO3NAL337DZWXD6UXIKKU/events.json","paper":"https://pith.science/paper/KJZNAAO3"},"agent_actions":{"view_html":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU","download_json":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU.json","view_paper":"https://pith.science/paper/KJZNAAO3","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1510.05041&json=true","fetch_graph":"https://pith.science/api/pith-number/KJZNAAO3NAL337DZWXD6UXIKKU/graph.json","fetch_events":"https://pith.science/api/pith-number/KJZNAAO3NAL337DZWXD6UXIKKU/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/action/timestamp_anchor","attest_storage":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/action/storage_attestation","attest_author":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/action/author_attestation","sign_citation":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/action/citation_signature","submit_replication":"https://pith.science/pith/KJZNAAO3NAL337DZWXD6UXIKKU/action/replication_record"}},"created_at":"2026-05-18T01:29:53.345063+00:00","updated_at":"2026-05-18T01:29:53.345063+00:00"}