{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:H7MFXKAP45HVEBZYYORIM7C55D","short_pith_number":"pith:H7MFXKAP","schema_version":"1.0","canonical_sha256":"3fd85ba80fe74f520738c3a2867c5de8fcc88f19c03e67ce959f8d2753a71dad","source":{"kind":"arxiv","id":"2605.19561","version":1},"attestation_state":"computed","paper":{"title":"TORQ: Two-Level Orthogonal Rotation for MXFP4 Quantization","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Dawei Yang, Xing Hu, Zukang Xu","submitted_at":"2026-05-19T09:05:47Z","abstract_excerpt":"As Large Language Models (LLMs) advance toward practical deployment, the Microscaling FP4 (MXFP4) format has emerged as a cornerstone for next-generation low-bit inference, owing to its ability to balance high dynamic range with hardware efficiency. However, directly applying MXFP4 to LLM activation quantization inevitably leads to significant accuracy degradation. In this paper, we theoretically analyze the error structure of MXFP4 activation quantization, revealing that the root cause of this performance drop lies in two structural imbalances between activation distributions and the MXFP4 bl"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.19561","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-19T09:05:47Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"33336ee6f1341008c060722314696d867b0bc2ab18b5fb77ba25d95f36857490","abstract_canon_sha256":"7b3bbbb7f2401e3fd6845e99129008b287b15cd4922c4926a40737a41cf70685"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:05:51.861254Z","signature_b64":"KxqjexJW1PbQ8LVy6j2VjYdyz4ofaahCS2FlKHEW+g0NJaXnNNmCEO1yC1A5OqZw4t72xz0zoLdlsvCFObVaCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3fd85ba80fe74f520738c3a2867c5de8fcc88f19c03e67ce959f8d2753a71dad","last_reissued_at":"2026-05-20T01:05:51.860542Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:05:51.860542Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"TORQ: Two-Level Orthogonal Rotation for MXFP4 Quantization","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Dawei Yang, Xing Hu, Zukang Xu","submitted_at":"2026-05-19T09:05:47Z","abstract_excerpt":"As Large Language Models (LLMs) advance toward practical deployment, the Microscaling FP4 (MXFP4) format has emerged as a cornerstone for next-generation low-bit inference, owing to its ability to balance high dynamic range with hardware efficiency. However, directly applying MXFP4 to LLM activation quantization inevitably leads to significant accuracy degradation. In this paper, we theoretically analyze the error structure of MXFP4 activation quantization, revealing that the root cause of this performance drop lies in two structural imbalances between activation distributions and the MXFP4 bl"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19561","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.19561/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.19561","created_at":"2026-05-20T01:05:51.860651+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.19561v1","created_at":"2026-05-20T01:05:51.860651+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19561","created_at":"2026-05-20T01:05:51.860651+00:00"},{"alias_kind":"pith_short_12","alias_value":"H7MFXKAP45HV","created_at":"2026-05-20T01:05:51.860651+00:00"},{"alias_kind":"pith_short_16","alias_value":"H7MFXKAP45HVEBZY","created_at":"2026-05-20T01:05:51.860651+00:00"},{"alias_kind":"pith_short_8","alias_value":"H7MFXKAP","created_at":"2026-05-20T01:05:51.860651+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D","json":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D.json","graph_json":"https://pith.science/api/pith-number/H7MFXKAP45HVEBZYYORIM7C55D/graph.json","events_json":"https://pith.science/api/pith-number/H7MFXKAP45HVEBZYYORIM7C55D/events.json","paper":"https://pith.science/paper/H7MFXKAP"},"agent_actions":{"view_html":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D","download_json":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D.json","view_paper":"https://pith.science/paper/H7MFXKAP","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.19561&json=true","fetch_graph":"https://pith.science/api/pith-number/H7MFXKAP45HVEBZYYORIM7C55D/graph.json","fetch_events":"https://pith.science/api/pith-number/H7MFXKAP45HVEBZYYORIM7C55D/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D/action/timestamp_anchor","attest_storage":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D/action/storage_attestation","attest_author":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D/action/author_attestation","sign_citation":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D/action/citation_signature","submit_replication":"https://pith.science/pith/H7MFXKAP45HVEBZYYORIM7C55D/action/replication_record"}},"created_at":"2026-05-20T01:05:51.860651+00:00","updated_at":"2026-05-20T01:05:51.860651+00:00"}