{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:PU6IG7CQLGPGCW2UD5BTNWZLVP","short_pith_number":"pith:PU6IG7CQ","schema_version":"1.0","canonical_sha256":"7d3c837c50599e615b541f4336db2babdab3136f30bb48abe37676b298b022b3","source":{"kind":"arxiv","id":"1603.03144","version":2},"attestation_state":"computed","paper":{"title":"Part-of-Speech Tagging for Historical English","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DL"],"primary_cat":"cs.CL","authors_text":"Jacob Eisenstein, Yi Yang","submitted_at":"2016-03-10T04:27:15Z","abstract_excerpt":"As more historical texts are digitized, there is interest in applying natural language processing tools to these archives. However, the performance of these tools is often unsatisfactory, due to language change and genre differences. Spelling normalization heuristics are the dominant solution for dealing with historical texts, but this approach fails to account for changes in usage and vocabulary. In this empirical paper, we assess the capability of domain adaptation techniques to cope with historical texts, focusing on the classic benchmark task of part-of-speech tagging. We evaluate several "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1603.03144","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-03-10T04:27:15Z","cross_cats_sorted":["cs.DL"],"title_canon_sha256":"b4405980b4cc122bc0b1fbee0f218b6b67630e1fd5cc16616a31c329c1ca7050","abstract_canon_sha256":"5bcf9a4c19c77449c0fc2d8699c278eeaae2613dbce5bc8efd3db3bb691d53ce"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:17:49.996039Z","signature_b64":"+ivdpVSygS2YFmt+F3jtweMedyJuJmOOtTGVXzx4UUL+Eei5SkbV/nJGwW5IqVOuR5CDVq58ovmrZ1216PTQBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7d3c837c50599e615b541f4336db2babdab3136f30bb48abe37676b298b022b3","last_reissued_at":"2026-05-18T01:17:49.995255Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:17:49.995255Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Part-of-Speech Tagging for Historical English","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DL"],"primary_cat":"cs.CL","authors_text":"Jacob Eisenstein, Yi Yang","submitted_at":"2016-03-10T04:27:15Z","abstract_excerpt":"As more historical texts are digitized, there is interest in applying natural language processing tools to these archives. However, the performance of these tools is often unsatisfactory, due to language change and genre differences. Spelling normalization heuristics are the dominant solution for dealing with historical texts, but this approach fails to account for changes in usage and vocabulary. In this empirical paper, we assess the capability of domain adaptation techniques to cope with historical texts, focusing on the classic benchmark task of part-of-speech tagging. We evaluate several "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1603.03144","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1603.03144","created_at":"2026-05-18T01:17:49.995387+00:00"},{"alias_kind":"arxiv_version","alias_value":"1603.03144v2","created_at":"2026-05-18T01:17:49.995387+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1603.03144","created_at":"2026-05-18T01:17:49.995387+00:00"},{"alias_kind":"pith_short_12","alias_value":"PU6IG7CQLGPG","created_at":"2026-05-18T12:30:39.010887+00:00"},{"alias_kind":"pith_short_16","alias_value":"PU6IG7CQLGPGCW2U","created_at":"2026-05-18T12:30:39.010887+00:00"},{"alias_kind":"pith_short_8","alias_value":"PU6IG7CQ","created_at":"2026-05-18T12:30:39.010887+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP","json":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP.json","graph_json":"https://pith.science/api/pith-number/PU6IG7CQLGPGCW2UD5BTNWZLVP/graph.json","events_json":"https://pith.science/api/pith-number/PU6IG7CQLGPGCW2UD5BTNWZLVP/events.json","paper":"https://pith.science/paper/PU6IG7CQ"},"agent_actions":{"view_html":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP","download_json":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP.json","view_paper":"https://pith.science/paper/PU6IG7CQ","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1603.03144&json=true","fetch_graph":"https://pith.science/api/pith-number/PU6IG7CQLGPGCW2UD5BTNWZLVP/graph.json","fetch_events":"https://pith.science/api/pith-number/PU6IG7CQLGPGCW2UD5BTNWZLVP/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP/action/timestamp_anchor","attest_storage":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP/action/storage_attestation","attest_author":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP/action/author_attestation","sign_citation":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP/action/citation_signature","submit_replication":"https://pith.science/pith/PU6IG7CQLGPGCW2UD5BTNWZLVP/action/replication_record"}},"created_at":"2026-05-18T01:17:49.995387+00:00","updated_at":"2026-05-18T01:17:49.995387+00:00"}