{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:6LGSCTFAXPXG46F75IQNRZYJR6","short_pith_number":"pith:6LGSCTFA","canonical_record":{"source":{"id":"1905.08920","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-21T10:33:06Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"35fa1f9460f88aeb690f65a7f8fe4421ab1ffa6a1d5e54769a583f3ee5d7dd0d","abstract_canon_sha256":"86b4257eda1d29588b64bd905fc69220d8097d9225f8c0b0e202bd8a16e12f3f"},"schema_version":"1.0"},"canonical_sha256":"f2cd214ca0bbee6e78bfea20d8e7098fb11fc3e7fc3f715f463a66da126b17c8","source":{"kind":"arxiv","id":"1905.08920","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.08920","created_at":"2026-05-17T23:45:24Z"},{"alias_kind":"arxiv_version","alias_value":"1905.08920v1","created_at":"2026-05-17T23:45:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.08920","created_at":"2026-05-17T23:45:24Z"},{"alias_kind":"pith_short_12","alias_value":"6LGSCTFAXPXG","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_16","alias_value":"6LGSCTFAXPXG46F7","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_8","alias_value":"6LGSCTFA","created_at":"2026-05-18T12:33:10Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:6LGSCTFAXPXG46F75IQNRZYJR6","target":"record","payload":{"canonical_record":{"source":{"id":"1905.08920","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-21T10:33:06Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"35fa1f9460f88aeb690f65a7f8fe4421ab1ffa6a1d5e54769a583f3ee5d7dd0d","abstract_canon_sha256":"86b4257eda1d29588b64bd905fc69220d8097d9225f8c0b0e202bd8a16e12f3f"},"schema_version":"1.0"},"canonical_sha256":"f2cd214ca0bbee6e78bfea20d8e7098fb11fc3e7fc3f715f463a66da126b17c8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:45:24.875404Z","signature_b64":"wVquxy/fwnokMBcpOAqq7R/UDdln6t7aD+ivLKSWIrNXakySQMx0WFddZ/4/oeSvMRTGiL/Q/ZfjCf60kZ5eCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f2cd214ca0bbee6e78bfea20d8e7098fb11fc3e7fc3f715f463a66da126b17c8","last_reissued_at":"2026-05-17T23:45:24.875034Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:45:24.875034Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1905.08920","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:45:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"eQ81/q66WLCGmI7eKTBqU6He2O9tArZH90hpgmr9eybp5Mf9sCJjEFwAOoYqze7Zm931infeW1qHWxPF8yA4Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T19:07:14.849256Z"},"content_sha256":"4bb876cfa3d04f025c305370381e1bc94fd495c92204b0022db273ba99ea7f38","schema_version":"1.0","event_id":"sha256:4bb876cfa3d04f025c305370381e1bc94fd495c92204b0022db273ba99ea7f38"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:6LGSCTFAXPXG46F75IQNRZYJR6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Domain adaptation for part-of-speech tagging of noisy user-generated text","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","stat.ML"],"primary_cat":"cs.CL","authors_text":"Benjamin Roth, Dietrich Trautmann, Luisa M\\\"arz","submitted_at":"2019-05-21T10:33:06Z","abstract_excerpt":"The performance of a Part-of-speech (POS) tagger is highly dependent on the domain ofthe processed text, and for many domains there is no or only very little training data available. This work addresses the problem of POS tagging noisy user-generated text using a neural network. We propose an architecture that trains an out-of-domain model on a large newswire corpus, and transfers those weights by using them as a prior for a model trained on the target domain (a data-set of German Tweets) for which there is very little an-notations available. The neural network has two standard bidirectional L"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.08920","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:45:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"u719BqlcR7jso5YD4L/WG4n/UA8tFwcARujlizVK4HZu6aoCxRNxMl71xy0AjrJ9/0ahZW3xfmpRXqQThHOpDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T19:07:14.849993Z"},"content_sha256":"800a23c551544a559c91511a33ba028a5f021117baa5b3c0d6d0b0df923a6f82","schema_version":"1.0","event_id":"sha256:800a23c551544a559c91511a33ba028a5f021117baa5b3c0d6d0b0df923a6f82"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6LGSCTFAXPXG46F75IQNRZYJR6/bundle.json","state_url":"https://pith.science/pith/6LGSCTFAXPXG46F75IQNRZYJR6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6LGSCTFAXPXG46F75IQNRZYJR6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-08T19:07:14Z","links":{"resolver":"https://pith.science/pith/6LGSCTFAXPXG46F75IQNRZYJR6","bundle":"https://pith.science/pith/6LGSCTFAXPXG46F75IQNRZYJR6/bundle.json","state":"https://pith.science/pith/6LGSCTFAXPXG46F75IQNRZYJR6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6LGSCTFAXPXG46F75IQNRZYJR6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:6LGSCTFAXPXG46F75IQNRZYJR6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"86b4257eda1d29588b64bd905fc69220d8097d9225f8c0b0e202bd8a16e12f3f","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-21T10:33:06Z","title_canon_sha256":"35fa1f9460f88aeb690f65a7f8fe4421ab1ffa6a1d5e54769a583f3ee5d7dd0d"},"schema_version":"1.0","source":{"id":"1905.08920","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.08920","created_at":"2026-05-17T23:45:24Z"},{"alias_kind":"arxiv_version","alias_value":"1905.08920v1","created_at":"2026-05-17T23:45:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.08920","created_at":"2026-05-17T23:45:24Z"},{"alias_kind":"pith_short_12","alias_value":"6LGSCTFAXPXG","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_16","alias_value":"6LGSCTFAXPXG46F7","created_at":"2026-05-18T12:33:10Z"},{"alias_kind":"pith_short_8","alias_value":"6LGSCTFA","created_at":"2026-05-18T12:33:10Z"}],"graph_snapshots":[{"event_id":"sha256:800a23c551544a559c91511a33ba028a5f021117baa5b3c0d6d0b0df923a6f82","target":"graph","created_at":"2026-05-17T23:45:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The performance of a Part-of-speech (POS) tagger is highly dependent on the domain ofthe processed text, and for many domains there is no or only very little training data available. This work addresses the problem of POS tagging noisy user-generated text using a neural network. We propose an architecture that trains an out-of-domain model on a large newswire corpus, and transfers those weights by using them as a prior for a model trained on the target domain (a data-set of German Tweets) for which there is very little an-notations available. The neural network has two standard bidirectional L","authors_text":"Benjamin Roth, Dietrich Trautmann, Luisa M\\\"arz","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-21T10:33:06Z","title":"Domain adaptation for part-of-speech tagging of noisy user-generated text"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.08920","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4bb876cfa3d04f025c305370381e1bc94fd495c92204b0022db273ba99ea7f38","target":"record","created_at":"2026-05-17T23:45:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"86b4257eda1d29588b64bd905fc69220d8097d9225f8c0b0e202bd8a16e12f3f","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2019-05-21T10:33:06Z","title_canon_sha256":"35fa1f9460f88aeb690f65a7f8fe4421ab1ffa6a1d5e54769a583f3ee5d7dd0d"},"schema_version":"1.0","source":{"id":"1905.08920","kind":"arxiv","version":1}},"canonical_sha256":"f2cd214ca0bbee6e78bfea20d8e7098fb11fc3e7fc3f715f463a66da126b17c8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f2cd214ca0bbee6e78bfea20d8e7098fb11fc3e7fc3f715f463a66da126b17c8","first_computed_at":"2026-05-17T23:45:24.875034Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:45:24.875034Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"wVquxy/fwnokMBcpOAqq7R/UDdln6t7aD+ivLKSWIrNXakySQMx0WFddZ/4/oeSvMRTGiL/Q/ZfjCf60kZ5eCA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:45:24.875404Z","signed_message":"canonical_sha256_bytes"},"source_id":"1905.08920","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4bb876cfa3d04f025c305370381e1bc94fd495c92204b0022db273ba99ea7f38","sha256:800a23c551544a559c91511a33ba028a5f021117baa5b3c0d6d0b0df923a6f82"],"state_sha256":"63202a12ff017b8942a6276da9dc910201a5d96b118ea87e20acecef6687966f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"zojcRZ0pfMwrf37buxTQPcEuZ3N9yE7S2Xm4hMPQOcS+5euBZ9WOz9a0XuQuxk5cFPZmnBNZlg6oPRVDNRRhDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-08T19:07:14.853722Z","bundle_sha256":"0d85f768852ea1f38e94809a621d28e08daf606ecdc47ca49b4ea0bd7b8ae39e"}}