{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:AGOEIKKK7KQNYNZJAQOAVDR4SR","short_pith_number":"pith:AGOEIKKK","canonical_record":{"source":{"id":"1810.10045","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-10-23T18:44:55Z","cross_cats_sorted":[],"title_canon_sha256":"1cf45aa43ea9e6d1a599a6d73f77042f702f0ebbe11f41a15413838ac83f4f84","abstract_canon_sha256":"327e441e401393f4d4ffead080913483439d333e3fdeb1f4d1e2f9719032b5bf"},"schema_version":"1.0"},"canonical_sha256":"019c44294afaa0dc3729041c0a8e3c9443bd21c320e8462a4c2040e8b191fce0","source":{"kind":"arxiv","id":"1810.10045","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.10045","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"arxiv_version","alias_value":"1810.10045v1","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.10045","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"pith_short_12","alias_value":"AGOEIKKK7KQN","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"AGOEIKKK7KQNYNZJ","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"AGOEIKKK","created_at":"2026-05-18T12:32:13Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:AGOEIKKK7KQNYNZJAQOAVDR4SR","target":"record","payload":{"canonical_record":{"source":{"id":"1810.10045","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-10-23T18:44:55Z","cross_cats_sorted":[],"title_canon_sha256":"1cf45aa43ea9e6d1a599a6d73f77042f702f0ebbe11f41a15413838ac83f4f84","abstract_canon_sha256":"327e441e401393f4d4ffead080913483439d333e3fdeb1f4d1e2f9719032b5bf"},"schema_version":"1.0"},"canonical_sha256":"019c44294afaa0dc3729041c0a8e3c9443bd21c320e8462a4c2040e8b191fce0","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:02:24.397089Z","signature_b64":"N8zLa+KIkFnchdEPWbrnffiz0UCK4KqhDdbT83Zfrw+2jK4pM7zQGkWvLBAUMi9Ast8rQoIHQEK0Ko8unbvcAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"019c44294afaa0dc3729041c0a8e3c9443bd21c320e8462a4c2040e8b191fce0","last_reissued_at":"2026-05-18T00:02:24.396449Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:02:24.396449Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1810.10045","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pHJhlXdB2O75k/AaMA1kTEMk0sbVmOYs532sDi6kvkXvXYpcrWplhGfAuOOUy+1rdfElllVXmkFuIFgoZNPRAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T02:35:42.314555Z"},"content_sha256":"df49ab144b3827eb95c3bdfa33f95ac31bcf5ddcbc1331c58796c9db3317156c","schema_version":"1.0","event_id":"sha256:df49ab144b3827eb95c3bdfa33f95ac31bcf5ddcbc1331c58796c9db3317156c"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:AGOEIKKK7KQNYNZJAQOAVDR4SR","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Language Modeling at Scale","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Gregory Diamos, Heewoo Jun, Jiaji Huang, Kenneth Church, Milind Chabbi, Mostofa Patwary","submitted_at":"2018-10-23T18:44:55Z","abstract_excerpt":"We show how Zipf's Law can be used to scale up language modeling (LM) to take advantage of more training data and more GPUs. LM plays a key role in many important natural language applications such as speech recognition and machine translation. Scaling up LM is important since it is widely accepted by the community that there is no data like more data. Eventually, we would like to train on terabytes (TBs) of text (trillions of words). Modern training methods are far from this goal, because of various bottlenecks, especially memory (within GPUs) and communication (across GPUs). This paper shows"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.10045","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"un7Q2l53vOC9XgAj8n6/c1ecOsaa8hMSNkoTWHFZKVkBBbGflc2Rt75UDx6mxLooSK9OVn+9NHzPlYBxeRUXDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T02:35:42.315206Z"},"content_sha256":"8cb412fd5f0318e14f336d327084de4b93137df1c778d743a00e4bb70e279f6f","schema_version":"1.0","event_id":"sha256:8cb412fd5f0318e14f336d327084de4b93137df1c778d743a00e4bb70e279f6f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/AGOEIKKK7KQNYNZJAQOAVDR4SR/bundle.json","state_url":"https://pith.science/pith/AGOEIKKK7KQNYNZJAQOAVDR4SR/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/AGOEIKKK7KQNYNZJAQOAVDR4SR/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-08T02:35:42Z","links":{"resolver":"https://pith.science/pith/AGOEIKKK7KQNYNZJAQOAVDR4SR","bundle":"https://pith.science/pith/AGOEIKKK7KQNYNZJAQOAVDR4SR/bundle.json","state":"https://pith.science/pith/AGOEIKKK7KQNYNZJAQOAVDR4SR/state.json","well_known_bundle":"https://pith.science/.well-known/pith/AGOEIKKK7KQNYNZJAQOAVDR4SR/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:AGOEIKKK7KQNYNZJAQOAVDR4SR","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"327e441e401393f4d4ffead080913483439d333e3fdeb1f4d1e2f9719032b5bf","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-10-23T18:44:55Z","title_canon_sha256":"1cf45aa43ea9e6d1a599a6d73f77042f702f0ebbe11f41a15413838ac83f4f84"},"schema_version":"1.0","source":{"id":"1810.10045","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.10045","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"arxiv_version","alias_value":"1810.10045v1","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.10045","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"pith_short_12","alias_value":"AGOEIKKK7KQN","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"AGOEIKKK7KQNYNZJ","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"AGOEIKKK","created_at":"2026-05-18T12:32:13Z"}],"graph_snapshots":[{"event_id":"sha256:8cb412fd5f0318e14f336d327084de4b93137df1c778d743a00e4bb70e279f6f","target":"graph","created_at":"2026-05-18T00:02:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We show how Zipf's Law can be used to scale up language modeling (LM) to take advantage of more training data and more GPUs. LM plays a key role in many important natural language applications such as speech recognition and machine translation. Scaling up LM is important since it is widely accepted by the community that there is no data like more data. Eventually, we would like to train on terabytes (TBs) of text (trillions of words). Modern training methods are far from this goal, because of various bottlenecks, especially memory (within GPUs) and communication (across GPUs). This paper shows","authors_text":"Gregory Diamos, Heewoo Jun, Jiaji Huang, Kenneth Church, Milind Chabbi, Mostofa Patwary","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-10-23T18:44:55Z","title":"Language Modeling at Scale"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.10045","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:df49ab144b3827eb95c3bdfa33f95ac31bcf5ddcbc1331c58796c9db3317156c","target":"record","created_at":"2026-05-18T00:02:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"327e441e401393f4d4ffead080913483439d333e3fdeb1f4d1e2f9719032b5bf","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-10-23T18:44:55Z","title_canon_sha256":"1cf45aa43ea9e6d1a599a6d73f77042f702f0ebbe11f41a15413838ac83f4f84"},"schema_version":"1.0","source":{"id":"1810.10045","kind":"arxiv","version":1}},"canonical_sha256":"019c44294afaa0dc3729041c0a8e3c9443bd21c320e8462a4c2040e8b191fce0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"019c44294afaa0dc3729041c0a8e3c9443bd21c320e8462a4c2040e8b191fce0","first_computed_at":"2026-05-18T00:02:24.396449Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:02:24.396449Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"N8zLa+KIkFnchdEPWbrnffiz0UCK4KqhDdbT83Zfrw+2jK4pM7zQGkWvLBAUMi9Ast8rQoIHQEK0Ko8unbvcAA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:02:24.397089Z","signed_message":"canonical_sha256_bytes"},"source_id":"1810.10045","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:df49ab144b3827eb95c3bdfa33f95ac31bcf5ddcbc1331c58796c9db3317156c","sha256:8cb412fd5f0318e14f336d327084de4b93137df1c778d743a00e4bb70e279f6f"],"state_sha256":"c72bcc1e2b845f3fab7625cbaaa83dec1619cb14b39691bbc3c946a024e5773b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"e3X/mKjVmPiRvzN5P6rM96ZSf6jBo35vtd4kvILYKaO1rteoEQnCiUIGG9GzFYddw95kPCkJUliJR4uJvdw7BA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-08T02:35:42.319057Z","bundle_sha256":"abdbc74b39e1c7f4b3660f0098c44f8b1e67c3dcb172d32d63db3d4c8879082e"}}