{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2015:XB6CJ5NY43G7AXHYCYPUQYADZC","short_pith_number":"pith:XB6CJ5NY","schema_version":"1.0","canonical_sha256":"b87c24f5b8e6cdf05cf8161f486003c89cd9aab494d747dd07d31828de8f7352","source":{"kind":"arxiv","id":"1510.06786","version":2},"attestation_state":"computed","paper":{"title":"Freshman or Fresher? Quantifying the Geographic Variation of Internet Language","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR","cs.LG"],"primary_cat":"cs.CL","authors_text":"Bryan Perozzi, Steven Skiena, Vivek Kulkarni","submitted_at":"2015-10-22T22:53:10Z","abstract_excerpt":"We present a new computational technique to detect and analyze statistically significant geographic variation in language. Our meta-analysis approach captures statistical properties of word usage across geographical regions and uses statistical methods to identify significant changes specific to regions. While previous approaches have primarily focused on lexical variation between regions, our method identifies words that demonstrate semantic and syntactic variation as well.\n  We extend recently developed techniques for neural language models to learn word representations which capture differi"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1510.06786","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-10-22T22:53:10Z","cross_cats_sorted":["cs.IR","cs.LG"],"title_canon_sha256":"bcdb2030fb2c509ba32e4d92199688dda3b07c5df3ce03d63c86e5aa5e34d3aa","abstract_canon_sha256":"af0bff6fb7d4527805a469420c7f46086f7ae9451de5c32c858462ed9f338f0b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:19:34.066865Z","signature_b64":"2yXA4HOlZEC2psabE+pd1jPYdEuU/5A6Pp1V5WZ2E1X+vK2g8IZzweBa8g7xs5fq59gLLH/Xu2qc1uSSuW2NBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b87c24f5b8e6cdf05cf8161f486003c89cd9aab494d747dd07d31828de8f7352","last_reissued_at":"2026-05-18T01:19:34.066433Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:19:34.066433Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Freshman or Fresher? Quantifying the Geographic Variation of Internet Language","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IR","cs.LG"],"primary_cat":"cs.CL","authors_text":"Bryan Perozzi, Steven Skiena, Vivek Kulkarni","submitted_at":"2015-10-22T22:53:10Z","abstract_excerpt":"We present a new computational technique to detect and analyze statistically significant geographic variation in language. Our meta-analysis approach captures statistical properties of word usage across geographical regions and uses statistical methods to identify significant changes specific to regions. While previous approaches have primarily focused on lexical variation between regions, our method identifies words that demonstrate semantic and syntactic variation as well.\n  We extend recently developed techniques for neural language models to learn word representations which capture differi"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1510.06786","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1510.06786","created_at":"2026-05-18T01:19:34.066501+00:00"},{"alias_kind":"arxiv_version","alias_value":"1510.06786v2","created_at":"2026-05-18T01:19:34.066501+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1510.06786","created_at":"2026-05-18T01:19:34.066501+00:00"},{"alias_kind":"pith_short_12","alias_value":"XB6CJ5NY43G7","created_at":"2026-05-18T12:29:50.041715+00:00"},{"alias_kind":"pith_short_16","alias_value":"XB6CJ5NY43G7AXHY","created_at":"2026-05-18T12:29:50.041715+00:00"},{"alias_kind":"pith_short_8","alias_value":"XB6CJ5NY","created_at":"2026-05-18T12:29:50.041715+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC","json":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC.json","graph_json":"https://pith.science/api/pith-number/XB6CJ5NY43G7AXHYCYPUQYADZC/graph.json","events_json":"https://pith.science/api/pith-number/XB6CJ5NY43G7AXHYCYPUQYADZC/events.json","paper":"https://pith.science/paper/XB6CJ5NY"},"agent_actions":{"view_html":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC","download_json":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC.json","view_paper":"https://pith.science/paper/XB6CJ5NY","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1510.06786&json=true","fetch_graph":"https://pith.science/api/pith-number/XB6CJ5NY43G7AXHYCYPUQYADZC/graph.json","fetch_events":"https://pith.science/api/pith-number/XB6CJ5NY43G7AXHYCYPUQYADZC/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC/action/timestamp_anchor","attest_storage":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC/action/storage_attestation","attest_author":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC/action/author_attestation","sign_citation":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC/action/citation_signature","submit_replication":"https://pith.science/pith/XB6CJ5NY43G7AXHYCYPUQYADZC/action/replication_record"}},"created_at":"2026-05-18T01:19:34.066501+00:00","updated_at":"2026-05-18T01:19:34.066501+00:00"}