{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2023:WWMGNKMITKHW6I236PQ5LJCDZA","short_pith_number":"pith:WWMGNKMI","canonical_record":{"source":{"id":"2311.02382","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2023-11-04T11:38:53Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c70e186cbc624522207fec85021fcf98c3f8fe79fce51a93de48f231daec130f","abstract_canon_sha256":"a7a0af2cd954f65e8c147b735e4c8df33c9c83bd80c76acd91eba94637b64f56"},"schema_version":"1.0"},"canonical_sha256":"b59866a9889a8f6f235bf3e1d5a443c8193104354d93b66fd0ae58feba7ea607","source":{"kind":"arxiv","id":"2311.02382","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2311.02382","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"arxiv_version","alias_value":"2311.02382v2","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2311.02382","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"pith_short_12","alias_value":"WWMGNKMITKHW","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"pith_short_16","alias_value":"WWMGNKMITKHW6I23","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"pith_short_8","alias_value":"WWMGNKMI","created_at":"2026-07-05T07:10:30Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2023:WWMGNKMITKHW6I236PQ5LJCDZA","target":"record","payload":{"canonical_record":{"source":{"id":"2311.02382","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2023-11-04T11:38:53Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c70e186cbc624522207fec85021fcf98c3f8fe79fce51a93de48f231daec130f","abstract_canon_sha256":"a7a0af2cd954f65e8c147b735e4c8df33c9c83bd80c76acd91eba94637b64f56"},"schema_version":"1.0"},"canonical_sha256":"b59866a9889a8f6f235bf3e1d5a443c8193104354d93b66fd0ae58feba7ea607","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T07:10:30.711593Z","signature_b64":"XnIipsztZ4hfYX6+2MZqGMmNqSYZu5MZiPSN1E3fbC2LGT1YDcHjD/rG5u3mqr25aBue16OFp4etr8r6vxehBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b59866a9889a8f6f235bf3e1d5a443c8193104354d93b66fd0ae58feba7ea607","last_reissued_at":"2026-07-05T07:10:30.711031Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T07:10:30.711031Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2311.02382","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T07:10:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CntaVP/okm/hR3d3qpD4+mQ7aia3oQe3d8T6GdQ2kyI7GzFP+t5OeWNjF+h7K/1px7BYTVt84wJYC6n7vtozDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T14:36:45.743702Z"},"content_sha256":"48f45229713c64d64f4f8136e3b4b8f689b95dfa4f3d160674fcc1c5546320e3","schema_version":"1.0","event_id":"sha256:48f45229713c64d64f4f8136e3b4b8f689b95dfa4f3d160674fcc1c5546320e3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2023:WWMGNKMITKHW6I236PQ5LJCDZA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Ultra-Long Sequence Distributed Transformer","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.DC","authors_text":"Aristeidis Tsaris, Hong-Jun Yoon, Isaac Lyngaas, John Gouley, Mayanka Chandra Shekar, Mohamed Wahib, Peng Chen, Sajal Dash, Tao Luo, Xiao Wang","submitted_at":"2023-11-04T11:38:53Z","abstract_excerpt":"Transformer models trained on long sequences often achieve higher accuracy than short sequences. Unfortunately, conventional transformers struggle with long sequence training due to the overwhelming computation and memory requirements. Existing methods for long sequence training offer limited speedup and memory reduction, and may compromise accuracy. This paper presents a novel and efficient distributed training method, the Long Short-Sequence Transformer (LSS Transformer), for training transformer with long sequences. It distributes a long sequence into segments among GPUs, with each GPU comp"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2311.02382","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2311.02382/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T07:10:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"n2JAx0VZkQwTMr/vZslsm3jiU2IKxjvBMgRM3CL2FoEwNGI191T4XPldOPFnnUjVDuGBqiHKT7qlam2/MZuiDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T14:36:45.744329Z"},"content_sha256":"ad360a9109aff8e8decb549d5443a14d26c3d574ca9f7591a27fc5f29f75d390","schema_version":"1.0","event_id":"sha256:ad360a9109aff8e8decb549d5443a14d26c3d574ca9f7591a27fc5f29f75d390"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WWMGNKMITKHW6I236PQ5LJCDZA/bundle.json","state_url":"https://pith.science/pith/WWMGNKMITKHW6I236PQ5LJCDZA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WWMGNKMITKHW6I236PQ5LJCDZA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T14:36:45Z","links":{"resolver":"https://pith.science/pith/WWMGNKMITKHW6I236PQ5LJCDZA","bundle":"https://pith.science/pith/WWMGNKMITKHW6I236PQ5LJCDZA/bundle.json","state":"https://pith.science/pith/WWMGNKMITKHW6I236PQ5LJCDZA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WWMGNKMITKHW6I236PQ5LJCDZA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2023:WWMGNKMITKHW6I236PQ5LJCDZA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a7a0af2cd954f65e8c147b735e4c8df33c9c83bd80c76acd91eba94637b64f56","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2023-11-04T11:38:53Z","title_canon_sha256":"c70e186cbc624522207fec85021fcf98c3f8fe79fce51a93de48f231daec130f"},"schema_version":"1.0","source":{"id":"2311.02382","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2311.02382","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"arxiv_version","alias_value":"2311.02382v2","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2311.02382","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"pith_short_12","alias_value":"WWMGNKMITKHW","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"pith_short_16","alias_value":"WWMGNKMITKHW6I23","created_at":"2026-07-05T07:10:30Z"},{"alias_kind":"pith_short_8","alias_value":"WWMGNKMI","created_at":"2026-07-05T07:10:30Z"}],"graph_snapshots":[{"event_id":"sha256:ad360a9109aff8e8decb549d5443a14d26c3d574ca9f7591a27fc5f29f75d390","target":"graph","created_at":"2026-07-05T07:10:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2311.02382/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Transformer models trained on long sequences often achieve higher accuracy than short sequences. Unfortunately, conventional transformers struggle with long sequence training due to the overwhelming computation and memory requirements. Existing methods for long sequence training offer limited speedup and memory reduction, and may compromise accuracy. This paper presents a novel and efficient distributed training method, the Long Short-Sequence Transformer (LSS Transformer), for training transformer with long sequences. It distributes a long sequence into segments among GPUs, with each GPU comp","authors_text":"Aristeidis Tsaris, Hong-Jun Yoon, Isaac Lyngaas, John Gouley, Mayanka Chandra Shekar, Mohamed Wahib, Peng Chen, Sajal Dash, Tao Luo, Xiao Wang","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2023-11-04T11:38:53Z","title":"Ultra-Long Sequence Distributed Transformer"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2311.02382","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:48f45229713c64d64f4f8136e3b4b8f689b95dfa4f3d160674fcc1c5546320e3","target":"record","created_at":"2026-07-05T07:10:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a7a0af2cd954f65e8c147b735e4c8df33c9c83bd80c76acd91eba94637b64f56","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2023-11-04T11:38:53Z","title_canon_sha256":"c70e186cbc624522207fec85021fcf98c3f8fe79fce51a93de48f231daec130f"},"schema_version":"1.0","source":{"id":"2311.02382","kind":"arxiv","version":2}},"canonical_sha256":"b59866a9889a8f6f235bf3e1d5a443c8193104354d93b66fd0ae58feba7ea607","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b59866a9889a8f6f235bf3e1d5a443c8193104354d93b66fd0ae58feba7ea607","first_computed_at":"2026-07-05T07:10:30.711031Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T07:10:30.711031Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"XnIipsztZ4hfYX6+2MZqGMmNqSYZu5MZiPSN1E3fbC2LGT1YDcHjD/rG5u3mqr25aBue16OFp4etr8r6vxehBA==","signature_status":"signed_v1","signed_at":"2026-07-05T07:10:30.711593Z","signed_message":"canonical_sha256_bytes"},"source_id":"2311.02382","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:48f45229713c64d64f4f8136e3b4b8f689b95dfa4f3d160674fcc1c5546320e3","sha256:ad360a9109aff8e8decb549d5443a14d26c3d574ca9f7591a27fc5f29f75d390"],"state_sha256":"6e994c54a6c769bd665f9504d71a2e9c6d68dfaac2e0020f751f7712a97ae867"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"o2S7CeHjgJL8Jh6BMFVkvmjaF6ArFi79h+ZEU38lKpS3Wn9Kbk3gaVM7/r6Rikc0ffq7LUfxWcS4oUJDSLnLBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T14:36:45.748519Z","bundle_sha256":"0946be22a6cd8eec42bc5a6def95b4077193fb31bebe0a4da3c6fc6fedfb734c"}}