{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:A44HR6T2DB3ZOE3XH2CILN3VZQ","short_pith_number":"pith:A44HR6T2","canonical_record":{"source":{"id":"1906.00532","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-06-03T02:29:22Z","cross_cats_sorted":[],"title_canon_sha256":"e3fe60c7f4ff36129ef126786ecbefcc8cc92de5d37dcb6548d83bde1229962b","abstract_canon_sha256":"07345bad92e9464844ede82e3e94242c514f2d138766c0bb13d4e52734414bbe"},"schema_version":"1.0"},"canonical_sha256":"073878fa7a18779713773e8485b775cc35ab38aabc1b8a357013e592afb5f5e4","source":{"kind":"arxiv","id":"1906.00532","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.00532","created_at":"2026-05-17T23:43:55Z"},{"alias_kind":"arxiv_version","alias_value":"1906.00532v2","created_at":"2026-05-17T23:43:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.00532","created_at":"2026-05-17T23:43:55Z"},{"alias_kind":"pith_short_12","alias_value":"A44HR6T2DB3Z","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_16","alias_value":"A44HR6T2DB3ZOE3X","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_8","alias_value":"A44HR6T2","created_at":"2026-05-18T12:33:12Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:A44HR6T2DB3ZOE3XH2CILN3VZQ","target":"record","payload":{"canonical_record":{"source":{"id":"1906.00532","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-06-03T02:29:22Z","cross_cats_sorted":[],"title_canon_sha256":"e3fe60c7f4ff36129ef126786ecbefcc8cc92de5d37dcb6548d83bde1229962b","abstract_canon_sha256":"07345bad92e9464844ede82e3e94242c514f2d138766c0bb13d4e52734414bbe"},"schema_version":"1.0"},"canonical_sha256":"073878fa7a18779713773e8485b775cc35ab38aabc1b8a357013e592afb5f5e4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:43:55.900821Z","signature_b64":"+lf1lHbQCtnY14tNJnZpyQs8AGJCElzOsFLKoNWimzygqQGTnudj88nr4rhMOeaFcRWK4H8PG1nnK84v31SaBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"073878fa7a18779713773e8485b775cc35ab38aabc1b8a357013e592afb5f5e4","last_reissued_at":"2026-05-17T23:43:55.900147Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:43:55.900147Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1906.00532","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:43:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QZ7FKIGFVTKNKcBGrPCjj9h1M4P8eRaEZDyYkdDelDfJwo2oMSpyKTHZrwfqQ3WKJIfz4PS2Aatk9KqIe+gfBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T02:34:43.284576Z"},"content_sha256":"918ecbb3c5f3b3c19d61afaebb434c6deba911fcd18fb82fae4e15ffca305779","schema_version":"1.0","event_id":"sha256:918ecbb3c5f3b3c19d61afaebb434c6deba911fcd18fb82fae4e15ffca305779"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:A44HR6T2DB3ZOE3XH2CILN3VZQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Efficient 8-Bit Quantization of Transformer Neural Machine Language Translation Model","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Aishwarya Bhandare, Deepthi Karkada, Kushal Datta, Sun Choi, Vamsi Sripathi, Vikram Saletore, Vivek Menon","submitted_at":"2019-06-03T02:29:22Z","abstract_excerpt":"In this work, we quantize a trained Transformer machine language translation model leveraging INT8/VNNI instructions in the latest Intel$^\\circledR$ Xeon$^\\circledR$ Cascade Lake processors to improve inference performance while maintaining less than 0.5$\\%$ drop in accuracy. To the best of our knowledge, this is the first attempt in the industry to quantize the Transformer model. This has high impact as it clearly demonstrates the various complexities of quantizing the language translation model. We present novel quantization techniques directly in TensorFlow to opportunistically replace 32-b"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.00532","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:43:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KCuhpabYlumaMFybUe8XN+JiilsQhnODHzAkViyQQ7ebzddawrxxsekYxSiY+hLvrrFREp2wr9UJQe16d1QwBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T02:34:43.284938Z"},"content_sha256":"451b48cecc2e5c441605a98779c5d3d727aaddbe360c819b495d47e6383a79f2","schema_version":"1.0","event_id":"sha256:451b48cecc2e5c441605a98779c5d3d727aaddbe360c819b495d47e6383a79f2"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/A44HR6T2DB3ZOE3XH2CILN3VZQ/bundle.json","state_url":"https://pith.science/pith/A44HR6T2DB3ZOE3XH2CILN3VZQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/A44HR6T2DB3ZOE3XH2CILN3VZQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T02:34:43Z","links":{"resolver":"https://pith.science/pith/A44HR6T2DB3ZOE3XH2CILN3VZQ","bundle":"https://pith.science/pith/A44HR6T2DB3ZOE3XH2CILN3VZQ/bundle.json","state":"https://pith.science/pith/A44HR6T2DB3ZOE3XH2CILN3VZQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/A44HR6T2DB3ZOE3XH2CILN3VZQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:A44HR6T2DB3ZOE3XH2CILN3VZQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"07345bad92e9464844ede82e3e94242c514f2d138766c0bb13d4e52734414bbe","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-06-03T02:29:22Z","title_canon_sha256":"e3fe60c7f4ff36129ef126786ecbefcc8cc92de5d37dcb6548d83bde1229962b"},"schema_version":"1.0","source":{"id":"1906.00532","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.00532","created_at":"2026-05-17T23:43:55Z"},{"alias_kind":"arxiv_version","alias_value":"1906.00532v2","created_at":"2026-05-17T23:43:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.00532","created_at":"2026-05-17T23:43:55Z"},{"alias_kind":"pith_short_12","alias_value":"A44HR6T2DB3Z","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_16","alias_value":"A44HR6T2DB3ZOE3X","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_8","alias_value":"A44HR6T2","created_at":"2026-05-18T12:33:12Z"}],"graph_snapshots":[{"event_id":"sha256:451b48cecc2e5c441605a98779c5d3d727aaddbe360c819b495d47e6383a79f2","target":"graph","created_at":"2026-05-17T23:43:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this work, we quantize a trained Transformer machine language translation model leveraging INT8/VNNI instructions in the latest Intel$^\\circledR$ Xeon$^\\circledR$ Cascade Lake processors to improve inference performance while maintaining less than 0.5$\\%$ drop in accuracy. To the best of our knowledge, this is the first attempt in the industry to quantize the Transformer model. This has high impact as it clearly demonstrates the various complexities of quantizing the language translation model. We present novel quantization techniques directly in TensorFlow to opportunistically replace 32-b","authors_text":"Aishwarya Bhandare, Deepthi Karkada, Kushal Datta, Sun Choi, Vamsi Sripathi, Vikram Saletore, Vivek Menon","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-06-03T02:29:22Z","title":"Efficient 8-Bit Quantization of Transformer Neural Machine Language Translation Model"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.00532","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:918ecbb3c5f3b3c19d61afaebb434c6deba911fcd18fb82fae4e15ffca305779","target":"record","created_at":"2026-05-17T23:43:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"07345bad92e9464844ede82e3e94242c514f2d138766c0bb13d4e52734414bbe","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-06-03T02:29:22Z","title_canon_sha256":"e3fe60c7f4ff36129ef126786ecbefcc8cc92de5d37dcb6548d83bde1229962b"},"schema_version":"1.0","source":{"id":"1906.00532","kind":"arxiv","version":2}},"canonical_sha256":"073878fa7a18779713773e8485b775cc35ab38aabc1b8a357013e592afb5f5e4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"073878fa7a18779713773e8485b775cc35ab38aabc1b8a357013e592afb5f5e4","first_computed_at":"2026-05-17T23:43:55.900147Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:43:55.900147Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+lf1lHbQCtnY14tNJnZpyQs8AGJCElzOsFLKoNWimzygqQGTnudj88nr4rhMOeaFcRWK4H8PG1nnK84v31SaBg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:43:55.900821Z","signed_message":"canonical_sha256_bytes"},"source_id":"1906.00532","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:918ecbb3c5f3b3c19d61afaebb434c6deba911fcd18fb82fae4e15ffca305779","sha256:451b48cecc2e5c441605a98779c5d3d727aaddbe360c819b495d47e6383a79f2"],"state_sha256":"5219a43e22c290992ebfff9e1056b1e3bf7bab58fa9f65f0f7d82cadc2801936"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VyTq5Mg5xiahZsa9wj/4vRjfHzfJ1pZaWAdNutFhZQHs5L0KvGcuxw6HRJcRKVOPSCcDUWdoCMADl791e59fAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T02:34:43.287170Z","bundle_sha256":"dd5da97ec982f1914fe0d175c5f447a609a42ecb6a1ec5ea8756f845bee560a6"}}