{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2019:3QNNWB4W42KH52OR7NEB3XUZ32","short_pith_number":"pith:3QNNWB4W","schema_version":"1.0","canonical_sha256":"dc1adb0796e6947ee9d1fb481dde99de8d6f83621ac07d9184b6bb87b5761923","source":{"kind":"arxiv","id":"1906.11298","version":1},"attestation_state":"computed","paper":{"title":"A Generative Model for Punctuation in Dependency Trees","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Dingquan Wang, Jason Eisner, Xiang Lisa Li","submitted_at":"2019-06-26T19:03:17Z","abstract_excerpt":"Treebanks traditionally treat punctuation marks as ordinary words, but linguists have suggested that a tree's \"true\" punctuation marks are not observed (Nunberg, 1990). These latent \"underlying\" marks serve to delimit or separate constituents in the syntax tree. When the tree's yield is rendered as a written sentence, a string rewriting mechanism transduces the underlying marks into \"surface\" marks, which are part of the observed (surface) string but should not be regarded as part of the tree. We formalize this idea in a generative model of punctuation that admits efficient dynamic programming"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1906.11298","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-06-26T19:03:17Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"1f6ee5802b29cc2d838a77c49bf21e01a2d0f0d7b55d570bd68006a75e94ed40","abstract_canon_sha256":"9ec50f64f5d87b6f457743556f7021f118f3dd8ea7016db7e8656e8ee0dfb8ab"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:42:07.571402Z","signature_b64":"VVwLTHHDEgvrsPG5yKtgabYxl++Epa8vpbADOQQB0YKvVb/f+pw4Eb8JRrF4HKLx8KTuatJYmtZrs4w0z3nvBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"dc1adb0796e6947ee9d1fb481dde99de8d6f83621ac07d9184b6bb87b5761923","last_reissued_at":"2026-05-17T23:42:07.570917Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:42:07.570917Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"A Generative Model for Punctuation in Dependency Trees","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Dingquan Wang, Jason Eisner, Xiang Lisa Li","submitted_at":"2019-06-26T19:03:17Z","abstract_excerpt":"Treebanks traditionally treat punctuation marks as ordinary words, but linguists have suggested that a tree's \"true\" punctuation marks are not observed (Nunberg, 1990). These latent \"underlying\" marks serve to delimit or separate constituents in the syntax tree. When the tree's yield is rendered as a written sentence, a string rewriting mechanism transduces the underlying marks into \"surface\" marks, which are part of the observed (surface) string but should not be regarded as part of the tree. We formalize this idea in a generative model of punctuation that admits efficient dynamic programming"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.11298","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1906.11298","created_at":"2026-05-17T23:42:07.570991+00:00"},{"alias_kind":"arxiv_version","alias_value":"1906.11298v1","created_at":"2026-05-17T23:42:07.570991+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.11298","created_at":"2026-05-17T23:42:07.570991+00:00"},{"alias_kind":"pith_short_12","alias_value":"3QNNWB4W42KH","created_at":"2026-05-18T12:33:07.085635+00:00"},{"alias_kind":"pith_short_16","alias_value":"3QNNWB4W42KH52OR","created_at":"2026-05-18T12:33:07.085635+00:00"},{"alias_kind":"pith_short_8","alias_value":"3QNNWB4W","created_at":"2026-05-18T12:33:07.085635+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32","json":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32.json","graph_json":"https://pith.science/api/pith-number/3QNNWB4W42KH52OR7NEB3XUZ32/graph.json","events_json":"https://pith.science/api/pith-number/3QNNWB4W42KH52OR7NEB3XUZ32/events.json","paper":"https://pith.science/paper/3QNNWB4W"},"agent_actions":{"view_html":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32","download_json":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32.json","view_paper":"https://pith.science/paper/3QNNWB4W","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1906.11298&json=true","fetch_graph":"https://pith.science/api/pith-number/3QNNWB4W42KH52OR7NEB3XUZ32/graph.json","fetch_events":"https://pith.science/api/pith-number/3QNNWB4W42KH52OR7NEB3XUZ32/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32/action/timestamp_anchor","attest_storage":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32/action/storage_attestation","attest_author":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32/action/author_attestation","sign_citation":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32/action/citation_signature","submit_replication":"https://pith.science/pith/3QNNWB4W42KH52OR7NEB3XUZ32/action/replication_record"}},"created_at":"2026-05-17T23:42:07.570991+00:00","updated_at":"2026-05-17T23:42:07.570991+00:00"}