{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:U4TAMNHX5QHDQJ74ON4AOLF63B","short_pith_number":"pith:U4TAMNHX","schema_version":"1.0","canonical_sha256":"a7260634f7ec0e3827fc7378072cbed8608ae069df9051296d3565170e9b31dd","source":{"kind":"arxiv","id":"2605.20670","version":1},"attestation_state":"computed","paper":{"title":"LT2: Linear-Time Looped Transformers","license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Chunyuan Deng, Hanjie Chen, Jiarui Liu, Rui-Jie Zhu, T. S. Eugene Ng, Yizhe Zhang, Yuanyuan Xu","submitted_at":"2026-05-20T03:36:44Z","abstract_excerpt":"Looped Transformers (LT) have emerged as a powerful architecture by iterating their layers multiple times before decoding the final token. However, pairing them with full attention retains quadratic complexity, making them computationally expensive and slow. We introduce LT2 (Linear-Time Looped Transformers), a family of looped architectures that replace quadratic softmax attention with subquadratic, linear-time attention. We study two variants: LT2-linear with linear attention and LT2-sparse with sparse attention. We find that looping uniquely synergizes with these variants: it enables iterat"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.20670","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-20T03:36:44Z","cross_cats_sorted":[],"title_canon_sha256":"fa1e2b6c355692644211c42a5067cf7d565bc3c31b79b2731f6cd91b894d3649","abstract_canon_sha256":"2955aaa2afba1feb09a0fbf9f3e42996152499b73012c87e6713693b20b9c0d9"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-21T01:04:48.371999Z","signature_b64":"eCKQ6icZyQMB7r7NeN/714bEUXU/SM+nW65minfYyXNV6ZeIQNN1+POWwW41Kej+53JyES/TYfNxYPYm/25pBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a7260634f7ec0e3827fc7378072cbed8608ae069df9051296d3565170e9b31dd","last_reissued_at":"2026-05-21T01:04:48.371298Z","signature_status":"signed_v1","first_computed_at":"2026-05-21T01:04:48.371298Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"LT2: Linear-Time Looped Transformers","license":"http://creativecommons.org/licenses/by-nc-nd/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Chunyuan Deng, Hanjie Chen, Jiarui Liu, Rui-Jie Zhu, T. S. Eugene Ng, Yizhe Zhang, Yuanyuan Xu","submitted_at":"2026-05-20T03:36:44Z","abstract_excerpt":"Looped Transformers (LT) have emerged as a powerful architecture by iterating their layers multiple times before decoding the final token. However, pairing them with full attention retains quadratic complexity, making them computationally expensive and slow. We introduce LT2 (Linear-Time Looped Transformers), a family of looped architectures that replace quadratic softmax attention with subquadratic, linear-time attention. We study two variants: LT2-linear with linear attention and LT2-sparse with sparse attention. We find that looping uniquely synergizes with these variants: it enables iterat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.20670","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.20670/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.20670","created_at":"2026-05-21T01:04:48.371411+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.20670v1","created_at":"2026-05-21T01:04:48.371411+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.20670","created_at":"2026-05-21T01:04:48.371411+00:00"},{"alias_kind":"pith_short_12","alias_value":"U4TAMNHX5QHD","created_at":"2026-05-21T01:04:48.371411+00:00"},{"alias_kind":"pith_short_16","alias_value":"U4TAMNHX5QHDQJ74","created_at":"2026-05-21T01:04:48.371411+00:00"},{"alias_kind":"pith_short_8","alias_value":"U4TAMNHX","created_at":"2026-05-21T01:04:48.371411+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B","json":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B.json","graph_json":"https://pith.science/api/pith-number/U4TAMNHX5QHDQJ74ON4AOLF63B/graph.json","events_json":"https://pith.science/api/pith-number/U4TAMNHX5QHDQJ74ON4AOLF63B/events.json","paper":"https://pith.science/paper/U4TAMNHX"},"agent_actions":{"view_html":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B","download_json":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B.json","view_paper":"https://pith.science/paper/U4TAMNHX","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.20670&json=true","fetch_graph":"https://pith.science/api/pith-number/U4TAMNHX5QHDQJ74ON4AOLF63B/graph.json","fetch_events":"https://pith.science/api/pith-number/U4TAMNHX5QHDQJ74ON4AOLF63B/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B/action/timestamp_anchor","attest_storage":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B/action/storage_attestation","attest_author":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B/action/author_attestation","sign_citation":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B/action/citation_signature","submit_replication":"https://pith.science/pith/U4TAMNHX5QHDQJ74ON4AOLF63B/action/replication_record"}},"created_at":"2026-05-21T01:04:48.371411+00:00","updated_at":"2026-05-21T01:04:48.371411+00:00"}