{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:3JB5DNQIR3FMCEK67HNOBR4C34","short_pith_number":"pith:3JB5DNQI","canonical_record":{"source":{"id":"1905.13150","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-30T16:12:26Z","cross_cats_sorted":["cs.SD","eess.AS"],"title_canon_sha256":"59f0b60da042c59b4b39b05375711044cbfb79703f5cb58285224f47e53880b3","abstract_canon_sha256":"e10917c65d308bb15ef04e5530172cbfaf835c9e8d1d78f529e4833072fe821a"},"schema_version":"1.0"},"canonical_sha256":"da43d1b6088ecac1115ef9dae0c782df09c200bff05f824886dacd68bce0703a","source":{"kind":"arxiv","id":"1905.13150","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.13150","created_at":"2026-05-17T23:40:43Z"},{"alias_kind":"arxiv_version","alias_value":"1905.13150v2","created_at":"2026-05-17T23:40:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.13150","created_at":"2026-05-17T23:40:43Z"},{"alias_kind":"pith_short_12","alias_value":"3JB5DNQIR3FM","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"3JB5DNQIR3FMCEK6","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"3JB5DNQI","created_at":"2026-05-18T12:33:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:3JB5DNQIR3FMCEK67HNOBR4C34","target":"record","payload":{"canonical_record":{"source":{"id":"1905.13150","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-30T16:12:26Z","cross_cats_sorted":["cs.SD","eess.AS"],"title_canon_sha256":"59f0b60da042c59b4b39b05375711044cbfb79703f5cb58285224f47e53880b3","abstract_canon_sha256":"e10917c65d308bb15ef04e5530172cbfaf835c9e8d1d78f529e4833072fe821a"},"schema_version":"1.0"},"canonical_sha256":"da43d1b6088ecac1115ef9dae0c782df09c200bff05f824886dacd68bce0703a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:40:43.217954Z","signature_b64":"uCjhetOnMDS/xqvk3IS9g9zwr287IytarXa5A+776MSosGG/ZAGuIStvhlriVbXlNjKApG0//ggsToVKVs4UAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"da43d1b6088ecac1115ef9dae0c782df09c200bff05f824886dacd68bce0703a","last_reissued_at":"2026-05-17T23:40:43.217366Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:40:43.217366Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1905.13150","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:40:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2Te+IQhFfIPvzbJkYTNjWLASwxQAxT299lR9PKS1sC+9iuN72i5Iq+D3cvc/iOe+L5Q+LW614isWvBOXu6lRCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:37:56.287428Z"},"content_sha256":"1503e1accdb3582592e8fe70c91071c0a72d1f7bc5f938d8d6332610222d2c50","schema_version":"1.0","event_id":"sha256:1503e1accdb3582592e8fe70c91071c0a72d1f7bc5f938d8d6332610222d2c50"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:3JB5DNQIR3FMCEK67HNOBR4C34","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Lattice-based lightly-supervised acoustic model training","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.SD","eess.AS"],"primary_cat":"cs.CL","authors_text":"Joachim Fainberg, Ond\\v{r}ej Klejch, Peter Bell, Steve Renals","submitted_at":"2019-05-30T16:12:26Z","abstract_excerpt":"In the broadcast domain there is an abundance of related text data and partial transcriptions, such as closed captions and subtitles. This text data can be used for lightly supervised training, in which text matching the audio is selected using an existing speech recognition model. Current approaches to light supervision typically filter the data based on matching error rates between the transcriptions and biased decoding hypotheses. In contrast, semi-supervised training does not require matching text data, instead generating a hypothesis using a background language model. State-of-the-art sem"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.13150","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:40:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CCmpAJts/O43nG/lAN7IlLwmwat9tUFwxQEH23GhL55GvFyO6c3Tm9aM9w6rFflwRkhFXHlP+dHtAqsE3YuDAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:37:56.288073Z"},"content_sha256":"b554a073d4a6e33a4766b35104ac1512032aea196c5b992dcb29f2b060372eb9","schema_version":"1.0","event_id":"sha256:b554a073d4a6e33a4766b35104ac1512032aea196c5b992dcb29f2b060372eb9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3JB5DNQIR3FMCEK67HNOBR4C34/bundle.json","state_url":"https://pith.science/pith/3JB5DNQIR3FMCEK67HNOBR4C34/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3JB5DNQIR3FMCEK67HNOBR4C34/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-29T23:37:56Z","links":{"resolver":"https://pith.science/pith/3JB5DNQIR3FMCEK67HNOBR4C34","bundle":"https://pith.science/pith/3JB5DNQIR3FMCEK67HNOBR4C34/bundle.json","state":"https://pith.science/pith/3JB5DNQIR3FMCEK67HNOBR4C34/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3JB5DNQIR3FMCEK67HNOBR4C34/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:3JB5DNQIR3FMCEK67HNOBR4C34","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e10917c65d308bb15ef04e5530172cbfaf835c9e8d1d78f529e4833072fe821a","cross_cats_sorted":["cs.SD","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-30T16:12:26Z","title_canon_sha256":"59f0b60da042c59b4b39b05375711044cbfb79703f5cb58285224f47e53880b3"},"schema_version":"1.0","source":{"id":"1905.13150","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.13150","created_at":"2026-05-17T23:40:43Z"},{"alias_kind":"arxiv_version","alias_value":"1905.13150v2","created_at":"2026-05-17T23:40:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.13150","created_at":"2026-05-17T23:40:43Z"},{"alias_kind":"pith_short_12","alias_value":"3JB5DNQIR3FM","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"3JB5DNQIR3FMCEK6","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"3JB5DNQI","created_at":"2026-05-18T12:33:07Z"}],"graph_snapshots":[{"event_id":"sha256:b554a073d4a6e33a4766b35104ac1512032aea196c5b992dcb29f2b060372eb9","target":"graph","created_at":"2026-05-17T23:40:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In the broadcast domain there is an abundance of related text data and partial transcriptions, such as closed captions and subtitles. This text data can be used for lightly supervised training, in which text matching the audio is selected using an existing speech recognition model. Current approaches to light supervision typically filter the data based on matching error rates between the transcriptions and biased decoding hypotheses. In contrast, semi-supervised training does not require matching text data, instead generating a hypothesis using a background language model. State-of-the-art sem","authors_text":"Joachim Fainberg, Ond\\v{r}ej Klejch, Peter Bell, Steve Renals","cross_cats":["cs.SD","eess.AS"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-30T16:12:26Z","title":"Lattice-based lightly-supervised acoustic model training"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.13150","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1503e1accdb3582592e8fe70c91071c0a72d1f7bc5f938d8d6332610222d2c50","target":"record","created_at":"2026-05-17T23:40:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e10917c65d308bb15ef04e5530172cbfaf835c9e8d1d78f529e4833072fe821a","cross_cats_sorted":["cs.SD","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-30T16:12:26Z","title_canon_sha256":"59f0b60da042c59b4b39b05375711044cbfb79703f5cb58285224f47e53880b3"},"schema_version":"1.0","source":{"id":"1905.13150","kind":"arxiv","version":2}},"canonical_sha256":"da43d1b6088ecac1115ef9dae0c782df09c200bff05f824886dacd68bce0703a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"da43d1b6088ecac1115ef9dae0c782df09c200bff05f824886dacd68bce0703a","first_computed_at":"2026-05-17T23:40:43.217366Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:40:43.217366Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"uCjhetOnMDS/xqvk3IS9g9zwr287IytarXa5A+776MSosGG/ZAGuIStvhlriVbXlNjKApG0//ggsToVKVs4UAQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:40:43.217954Z","signed_message":"canonical_sha256_bytes"},"source_id":"1905.13150","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1503e1accdb3582592e8fe70c91071c0a72d1f7bc5f938d8d6332610222d2c50","sha256:b554a073d4a6e33a4766b35104ac1512032aea196c5b992dcb29f2b060372eb9"],"state_sha256":"cdb98ff6aeecfe092c82790630e14894fb3dae37d3be985f7b07339fc9ee2b65"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"t41PWA0g1AiceCsgBqAHL80r6WJ8+1Zixc0JYI65d4I40vowKSxYdiTqeseDe9bXim3jljTXcwBBlRQn4TT4CQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-29T23:37:56.291198Z","bundle_sha256":"46373b0926794476a9414b4cc96993325bcccc739274f8ee2d4a52160b1b627b"}}