{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:IBCEZFKZ3H47BO4T672ZATTLPW","short_pith_number":"pith:IBCEZFKZ","canonical_record":{"source":{"id":"1803.01090","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-03T02:08:46Z","cross_cats_sorted":[],"title_canon_sha256":"288f1fd632629b321a63dbc4aaf14d586935ee4fb1a65b6410cefbe6eaa3b404","abstract_canon_sha256":"e39d75b3a25b41aa1fb3ec925f598e8e344ba6e7fe0dc62cff3fc7de55051959"},"schema_version":"1.0"},"canonical_sha256":"40444c9559d9f9f0bb93f7f5904e6b7db24fa48d7c7e69a56c2f6923dbd939a1","source":{"kind":"arxiv","id":"1803.01090","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.01090","created_at":"2026-05-18T00:22:01Z"},{"alias_kind":"arxiv_version","alias_value":"1803.01090v1","created_at":"2026-05-18T00:22:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.01090","created_at":"2026-05-18T00:22:01Z"},{"alias_kind":"pith_short_12","alias_value":"IBCEZFKZ3H47","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"IBCEZFKZ3H47BO4T","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"IBCEZFKZ","created_at":"2026-05-18T12:32:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:IBCEZFKZ3H47BO4T672ZATTLPW","target":"record","payload":{"canonical_record":{"source":{"id":"1803.01090","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-03T02:08:46Z","cross_cats_sorted":[],"title_canon_sha256":"288f1fd632629b321a63dbc4aaf14d586935ee4fb1a65b6410cefbe6eaa3b404","abstract_canon_sha256":"e39d75b3a25b41aa1fb3ec925f598e8e344ba6e7fe0dc62cff3fc7de55051959"},"schema_version":"1.0"},"canonical_sha256":"40444c9559d9f9f0bb93f7f5904e6b7db24fa48d7c7e69a56c2f6923dbd939a1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:22:01.791686Z","signature_b64":"6Q4e7U03N+BuVZpPiFKJgyHPrebsH7UG5ATHxnpGzvVltsCFjqR4q+TS9ndU0RY97eLeXj9PWyImLkWkeK6jCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"40444c9559d9f9f0bb93f7f5904e6b7db24fa48d7c7e69a56c2f6923dbd939a1","last_reissued_at":"2026-05-18T00:22:01.791130Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:22:01.791130Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1803.01090","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"bDskDxd/uPnni9J6ip55pHNwl2T8OH5jpQ8JrgWD2BjEEwLPDOgyquSniPyLsSVzpU36z0KrWzfYraxocozuBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T05:33:49.052028Z"},"content_sha256":"4343c26ef61afdb0edee850c4c44cdb7b245fdf5d84e8f241f66a72b111ef01f","schema_version":"1.0","event_id":"sha256:4343c26ef61afdb0edee850c4c44cdb7b245fdf5d84e8f241f66a72b111ef01f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:IBCEZFKZ3H47BO4T672ZATTLPW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"On Modular Training of Neural Acoustics-to-Word Model for LVCSR","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Hao Li, Kai Yu, Qi Liu, Zhehuai Chen","submitted_at":"2018-03-03T02:08:46Z","abstract_excerpt":"End-to-end (E2E) automatic speech recognition (ASR) systems directly map acoustics to words using a unified model. Previous works mostly focus on E2E training a single model which integrates acoustic and language model into a whole. Although E2E training benefits from sequence modeling and simplified decoding pipelines, large amount of transcribed acoustic data is usually required, and traditional acoustic and language modelling techniques cannot be utilized. In this paper, a novel modular training framework of E2E ASR is proposed to separately train neural acoustic and language models during "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.01090","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"4xatx56lYGsRDHRDdmiaZ8JJ+jTtSZNbvBtY460AyN7dZQAnxV7LDGQnyPmiMydj+chRzIOYZaVmolNeIPmwCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T05:33:49.052647Z"},"content_sha256":"669c72f20d51f2602a62f4c47fdbcddcb352ea471d444241ae0082379e541dfa","schema_version":"1.0","event_id":"sha256:669c72f20d51f2602a62f4c47fdbcddcb352ea471d444241ae0082379e541dfa"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/IBCEZFKZ3H47BO4T672ZATTLPW/bundle.json","state_url":"https://pith.science/pith/IBCEZFKZ3H47BO4T672ZATTLPW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/IBCEZFKZ3H47BO4T672ZATTLPW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T05:33:49Z","links":{"resolver":"https://pith.science/pith/IBCEZFKZ3H47BO4T672ZATTLPW","bundle":"https://pith.science/pith/IBCEZFKZ3H47BO4T672ZATTLPW/bundle.json","state":"https://pith.science/pith/IBCEZFKZ3H47BO4T672ZATTLPW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/IBCEZFKZ3H47BO4T672ZATTLPW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:IBCEZFKZ3H47BO4T672ZATTLPW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e39d75b3a25b41aa1fb3ec925f598e8e344ba6e7fe0dc62cff3fc7de55051959","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-03T02:08:46Z","title_canon_sha256":"288f1fd632629b321a63dbc4aaf14d586935ee4fb1a65b6410cefbe6eaa3b404"},"schema_version":"1.0","source":{"id":"1803.01090","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.01090","created_at":"2026-05-18T00:22:01Z"},{"alias_kind":"arxiv_version","alias_value":"1803.01090v1","created_at":"2026-05-18T00:22:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.01090","created_at":"2026-05-18T00:22:01Z"},{"alias_kind":"pith_short_12","alias_value":"IBCEZFKZ3H47","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"IBCEZFKZ3H47BO4T","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"IBCEZFKZ","created_at":"2026-05-18T12:32:28Z"}],"graph_snapshots":[{"event_id":"sha256:669c72f20d51f2602a62f4c47fdbcddcb352ea471d444241ae0082379e541dfa","target":"graph","created_at":"2026-05-18T00:22:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"End-to-end (E2E) automatic speech recognition (ASR) systems directly map acoustics to words using a unified model. Previous works mostly focus on E2E training a single model which integrates acoustic and language model into a whole. Although E2E training benefits from sequence modeling and simplified decoding pipelines, large amount of transcribed acoustic data is usually required, and traditional acoustic and language modelling techniques cannot be utilized. In this paper, a novel modular training framework of E2E ASR is proposed to separately train neural acoustic and language models during ","authors_text":"Hao Li, Kai Yu, Qi Liu, Zhehuai Chen","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-03T02:08:46Z","title":"On Modular Training of Neural Acoustics-to-Word Model for LVCSR"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.01090","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4343c26ef61afdb0edee850c4c44cdb7b245fdf5d84e8f241f66a72b111ef01f","target":"record","created_at":"2026-05-18T00:22:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e39d75b3a25b41aa1fb3ec925f598e8e344ba6e7fe0dc62cff3fc7de55051959","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-03T02:08:46Z","title_canon_sha256":"288f1fd632629b321a63dbc4aaf14d586935ee4fb1a65b6410cefbe6eaa3b404"},"schema_version":"1.0","source":{"id":"1803.01090","kind":"arxiv","version":1}},"canonical_sha256":"40444c9559d9f9f0bb93f7f5904e6b7db24fa48d7c7e69a56c2f6923dbd939a1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"40444c9559d9f9f0bb93f7f5904e6b7db24fa48d7c7e69a56c2f6923dbd939a1","first_computed_at":"2026-05-18T00:22:01.791130Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:22:01.791130Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"6Q4e7U03N+BuVZpPiFKJgyHPrebsH7UG5ATHxnpGzvVltsCFjqR4q+TS9ndU0RY97eLeXj9PWyImLkWkeK6jCw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:22:01.791686Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.01090","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4343c26ef61afdb0edee850c4c44cdb7b245fdf5d84e8f241f66a72b111ef01f","sha256:669c72f20d51f2602a62f4c47fdbcddcb352ea471d444241ae0082379e541dfa"],"state_sha256":"2b778d009f446b9748e759a8e2cc23855747722456fe7f3fb6dd7db7cd01e217"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G5IeDgHtIQ3oqJ+Eh69YMOI7t192WPj1vLyY7AB2z/UciziF2u6tPSZk6w/mCQEoF3DRanwUIAUCjY04+jldCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T05:33:49.055748Z","bundle_sha256":"db1400e090f29d0689ee1d1c29df6586f36910ca30ca9f9709d96b3346e240fb"}}