{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:7FNS7PZCVYYMZOZRIKPFIFWKE5","short_pith_number":"pith:7FNS7PZC","schema_version":"1.0","canonical_sha256":"f95b2fbf22ae30ccbb31429e5416ca277ea57942494da96327f433d2ca6eb7e3","source":{"kind":"arxiv","id":"1612.00148","version":1},"attestation_state":"computed","paper":{"title":"Domain Adaptation for Named Entity Recognition in Online Media with Word Embeddings","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Troy Chevalier, Vivek Kulkarni, Yashar Mehdad","submitted_at":"2016-12-01T05:08:53Z","abstract_excerpt":"Content on the Internet is heterogeneous and arises from various domains like News, Entertainment, Finance and Technology. Understanding such content requires identifying named entities (persons, places and organizations) as one of the key steps. Traditionally Named Entity Recognition (NER) systems have been built using available annotated datasets (like CoNLL, MUC) and demonstrate excellent performance. However, these models fail to generalize onto other domains like Sports and Finance where conventions and language use can differ significantly. Furthermore, several domains do not have large "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1612.00148","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-12-01T05:08:53Z","cross_cats_sorted":["cs.IR"],"title_canon_sha256":"5b42b34ac1bd901e1b9ea273148e2a701228a5ece2b0f5f2c7e18fc7758961c0","abstract_canon_sha256":"d26a203a5e9a7a145693fde91a30f90fa571de57258dab39ec50c5c49b70f22d"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:56:05.909585Z","signature_b64":"YTYi4LTiZtJrzIkU8R9uGbc94DfMWe0w3RedQJWe2CjiA5ktiWfKXb09J3U8Ef562QDaOAusxXWyqMv7qV3CCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f95b2fbf22ae30ccbb31429e5416ca277ea57942494da96327f433d2ca6eb7e3","last_reissued_at":"2026-05-18T00:56:05.909003Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:56:05.909003Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Domain Adaptation for Named Entity Recognition in Online Media with Word Embeddings","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR"],"primary_cat":"cs.CL","authors_text":"Troy Chevalier, Vivek Kulkarni, Yashar Mehdad","submitted_at":"2016-12-01T05:08:53Z","abstract_excerpt":"Content on the Internet is heterogeneous and arises from various domains like News, Entertainment, Finance and Technology. Understanding such content requires identifying named entities (persons, places and organizations) as one of the key steps. Traditionally Named Entity Recognition (NER) systems have been built using available annotated datasets (like CoNLL, MUC) and demonstrate excellent performance. However, these models fail to generalize onto other domains like Sports and Finance where conventions and language use can differ significantly. Furthermore, several domains do not have large "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.00148","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1612.00148","created_at":"2026-05-18T00:56:05.909081+00:00"},{"alias_kind":"arxiv_version","alias_value":"1612.00148v1","created_at":"2026-05-18T00:56:05.909081+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.00148","created_at":"2026-05-18T00:56:05.909081+00:00"},{"alias_kind":"pith_short_12","alias_value":"7FNS7PZCVYYM","created_at":"2026-05-18T12:30:04.600751+00:00"},{"alias_kind":"pith_short_16","alias_value":"7FNS7PZCVYYMZOZR","created_at":"2026-05-18T12:30:04.600751+00:00"},{"alias_kind":"pith_short_8","alias_value":"7FNS7PZC","created_at":"2026-05-18T12:30:04.600751+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5","json":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5.json","graph_json":"https://pith.science/api/pith-number/7FNS7PZCVYYMZOZRIKPFIFWKE5/graph.json","events_json":"https://pith.science/api/pith-number/7FNS7PZCVYYMZOZRIKPFIFWKE5/events.json","paper":"https://pith.science/paper/7FNS7PZC"},"agent_actions":{"view_html":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5","download_json":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5.json","view_paper":"https://pith.science/paper/7FNS7PZC","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1612.00148&json=true","fetch_graph":"https://pith.science/api/pith-number/7FNS7PZCVYYMZOZRIKPFIFWKE5/graph.json","fetch_events":"https://pith.science/api/pith-number/7FNS7PZCVYYMZOZRIKPFIFWKE5/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5/action/timestamp_anchor","attest_storage":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5/action/storage_attestation","attest_author":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5/action/author_attestation","sign_citation":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5/action/citation_signature","submit_replication":"https://pith.science/pith/7FNS7PZCVYYMZOZRIKPFIFWKE5/action/replication_record"}},"created_at":"2026-05-18T00:56:05.909081+00:00","updated_at":"2026-05-18T00:56:05.909081+00:00"}