{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:BTLHJN2ZY7ZDLRUVMFRA73EMB3","short_pith_number":"pith:BTLHJN2Z","canonical_record":{"source":{"id":"1502.01446","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-02-05T07:42:18Z","cross_cats_sorted":[],"title_canon_sha256":"7d93ee69fd4907bc499c0707fc51dc094ad1a9a556991791a19425080df521ec","abstract_canon_sha256":"8dd18b1239ff819217eca8206f7e93c9e211355df3aa7171c86c79fced27b5db"},"schema_version":"1.0"},"canonical_sha256":"0cd674b759c7f235c69561620fec8c0ec42d489aab1051295d1488d225de4601","source":{"kind":"arxiv","id":"1502.01446","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1502.01446","created_at":"2026-05-18T02:27:52Z"},{"alias_kind":"arxiv_version","alias_value":"1502.01446v1","created_at":"2026-05-18T02:27:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1502.01446","created_at":"2026-05-18T02:27:52Z"},{"alias_kind":"pith_short_12","alias_value":"BTLHJN2ZY7ZD","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_16","alias_value":"BTLHJN2ZY7ZDLRUV","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_8","alias_value":"BTLHJN2Z","created_at":"2026-05-18T12:29:14Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:BTLHJN2ZY7ZDLRUVMFRA73EMB3","target":"record","payload":{"canonical_record":{"source":{"id":"1502.01446","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-02-05T07:42:18Z","cross_cats_sorted":[],"title_canon_sha256":"7d93ee69fd4907bc499c0707fc51dc094ad1a9a556991791a19425080df521ec","abstract_canon_sha256":"8dd18b1239ff819217eca8206f7e93c9e211355df3aa7171c86c79fced27b5db"},"schema_version":"1.0"},"canonical_sha256":"0cd674b759c7f235c69561620fec8c0ec42d489aab1051295d1488d225de4601","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:27:52.031474Z","signature_b64":"pa9cSbjKRx8bkA3EFtf6WqLmeKGx8FPdX+KkeZ54j9k6Jww6RtJr08uQW7fV8+NHeYMMtnXFPnwZKq+ACxGyCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0cd674b759c7f235c69561620fec8c0ec42d489aab1051295d1488d225de4601","last_reissued_at":"2026-05-18T02:27:52.030999Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:27:52.030999Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1502.01446","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:27:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"nL/xIj6BeoK6cUGiYyCDde6/TPHwilekqhJbvo5j9wLcPwV/PoxprfaRBr3xHdLR2lPcIL6Z/u1LBI6EaFdzBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:02:36.959000Z"},"content_sha256":"52ff0e802202a32d88227c4a9cf03b097dc1d9f1798a2552513efb14f449250f","schema_version":"1.0","event_id":"sha256:52ff0e802202a32d88227c4a9cf03b097dc1d9f1798a2552513efb14f449250f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:BTLHJN2ZY7ZDLRUVMFRA73EMB3","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Beyond Word-based Language Model in Statistical Machine Translation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Chengqing Zong, Jiajun Zhang, Ming Zhou, Mu Li, Shujie Liu","submitted_at":"2015-02-05T07:42:18Z","abstract_excerpt":"Language model is one of the most important modules in statistical machine translation and currently the word-based language model dominants this community. However, many translation models (e.g. phrase-based models) generate the target language sentences by rendering and compositing the phrases rather than the words. Thus, it is much more reasonable to model dependency between phrases, but few research work succeed in solving this problem. In this paper, we tackle this problem by designing a novel phrase-based language model which attempts to solve three key sub-problems: 1, how to define a p"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1502.01446","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:27:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yOdt2vmzU3+x7t+F/D8he6yeNH7L+HQWnilxSpbiZqlYEt8semS1o5TepzaCTPhV2U46t/noJjunFV3H96tOAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T12:02:36.959484Z"},"content_sha256":"0ebd5f5b95f1e48f612b1428043e921f30f2e37d65b30f8c55b195fcead034ca","schema_version":"1.0","event_id":"sha256:0ebd5f5b95f1e48f612b1428043e921f30f2e37d65b30f8c55b195fcead034ca"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/BTLHJN2ZY7ZDLRUVMFRA73EMB3/bundle.json","state_url":"https://pith.science/pith/BTLHJN2ZY7ZDLRUVMFRA73EMB3/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/BTLHJN2ZY7ZDLRUVMFRA73EMB3/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T12:02:36Z","links":{"resolver":"https://pith.science/pith/BTLHJN2ZY7ZDLRUVMFRA73EMB3","bundle":"https://pith.science/pith/BTLHJN2ZY7ZDLRUVMFRA73EMB3/bundle.json","state":"https://pith.science/pith/BTLHJN2ZY7ZDLRUVMFRA73EMB3/state.json","well_known_bundle":"https://pith.science/.well-known/pith/BTLHJN2ZY7ZDLRUVMFRA73EMB3/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:BTLHJN2ZY7ZDLRUVMFRA73EMB3","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8dd18b1239ff819217eca8206f7e93c9e211355df3aa7171c86c79fced27b5db","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-02-05T07:42:18Z","title_canon_sha256":"7d93ee69fd4907bc499c0707fc51dc094ad1a9a556991791a19425080df521ec"},"schema_version":"1.0","source":{"id":"1502.01446","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1502.01446","created_at":"2026-05-18T02:27:52Z"},{"alias_kind":"arxiv_version","alias_value":"1502.01446v1","created_at":"2026-05-18T02:27:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1502.01446","created_at":"2026-05-18T02:27:52Z"},{"alias_kind":"pith_short_12","alias_value":"BTLHJN2ZY7ZD","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_16","alias_value":"BTLHJN2ZY7ZDLRUV","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_8","alias_value":"BTLHJN2Z","created_at":"2026-05-18T12:29:14Z"}],"graph_snapshots":[{"event_id":"sha256:0ebd5f5b95f1e48f612b1428043e921f30f2e37d65b30f8c55b195fcead034ca","target":"graph","created_at":"2026-05-18T02:27:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Language model is one of the most important modules in statistical machine translation and currently the word-based language model dominants this community. However, many translation models (e.g. phrase-based models) generate the target language sentences by rendering and compositing the phrases rather than the words. Thus, it is much more reasonable to model dependency between phrases, but few research work succeed in solving this problem. In this paper, we tackle this problem by designing a novel phrase-based language model which attempts to solve three key sub-problems: 1, how to define a p","authors_text":"Chengqing Zong, Jiajun Zhang, Ming Zhou, Mu Li, Shujie Liu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-02-05T07:42:18Z","title":"Beyond Word-based Language Model in Statistical Machine Translation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1502.01446","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:52ff0e802202a32d88227c4a9cf03b097dc1d9f1798a2552513efb14f449250f","target":"record","created_at":"2026-05-18T02:27:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8dd18b1239ff819217eca8206f7e93c9e211355df3aa7171c86c79fced27b5db","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-02-05T07:42:18Z","title_canon_sha256":"7d93ee69fd4907bc499c0707fc51dc094ad1a9a556991791a19425080df521ec"},"schema_version":"1.0","source":{"id":"1502.01446","kind":"arxiv","version":1}},"canonical_sha256":"0cd674b759c7f235c69561620fec8c0ec42d489aab1051295d1488d225de4601","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0cd674b759c7f235c69561620fec8c0ec42d489aab1051295d1488d225de4601","first_computed_at":"2026-05-18T02:27:52.030999Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:27:52.030999Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"pa9cSbjKRx8bkA3EFtf6WqLmeKGx8FPdX+KkeZ54j9k6Jww6RtJr08uQW7fV8+NHeYMMtnXFPnwZKq+ACxGyCg==","signature_status":"signed_v1","signed_at":"2026-05-18T02:27:52.031474Z","signed_message":"canonical_sha256_bytes"},"source_id":"1502.01446","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:52ff0e802202a32d88227c4a9cf03b097dc1d9f1798a2552513efb14f449250f","sha256:0ebd5f5b95f1e48f612b1428043e921f30f2e37d65b30f8c55b195fcead034ca"],"state_sha256":"a1810731f81945100d8a0dd8f615bf00826c66958369ce2739ae3694eda59e5b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CFhCPW8F36aS6vfEUlu7GrupBBvEFD6zr9vkCQrS10pEWEaC/XYwzAxSPrfcNRpThCtf9BqYPQrE98hr2Y5xBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T12:02:36.962615Z","bundle_sha256":"0aabda4de4efb54f6a5af971ee9f99e4dc2188576bdffbdaae6a544bbf08b9b7"}}