{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:VMGB2BVNJEHQP6PM7ESFQBTHGQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"635fa21eb07200169cfcbca918cb952a64f615ae959c612e6b958ab193bad5da","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-04-17T06:37:25Z","title_canon_sha256":"6896165c79aec3b6bf3217edc533ec69e0acbae99cab7142eeb24adc0af1141f"},"schema_version":"1.0","source":{"id":"2604.15744","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.15744","created_at":"2026-06-03T01:05:13Z"},{"alias_kind":"arxiv_version","alias_value":"2604.15744v1","created_at":"2026-06-03T01:05:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.15744","created_at":"2026-06-03T01:05:13Z"},{"alias_kind":"pith_short_12","alias_value":"VMGB2BVNJEHQ","created_at":"2026-06-03T01:05:13Z"},{"alias_kind":"pith_short_16","alias_value":"VMGB2BVNJEHQP6PM","created_at":"2026-06-03T01:05:13Z"},{"alias_kind":"pith_short_8","alias_value":"VMGB2BVN","created_at":"2026-06-03T01:05:13Z"}],"graph_snapshots":[{"event_id":"sha256:f37f27254e7e04e955b67433f921ef3fbe6ff7ed9f34212823600c103275eaf0","target":"graph","created_at":"2026-06-03T01:05:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":3,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Users generally associate language with place, and place-related communities form a contiguous speech community, though alignment between geographic dialect communities and place-related communities remains complex. Advanced language modelling, including static and diachronic Word2Vec language embeddings, revealed semantic variation across place-based communities and meaningful semantic shifts within New Zealand English."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That Reddit communities tied to places accurately represent geographic dialect communities and that user perceptions of language-place links correspond to measurable patterns in actual language use."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"New Zealand Reddit users link language to place and form contiguous speech communities with complex geographic alignment; Word2Vec embeddings reveal semantic variations and shifts in NZ English on a 4.26 billion word corpus."}],"snapshot_sha256":"d1fb2e68ebd4c277a506b84f7f884264a67814bf63c72f8c05f5924b584c8433"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2604.15744/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"This thesis investigates geographic dialect alignment in place-informed social media communities, focussing on New Zealand-related Reddit communities. By integrating qualitative analyses of user perceptions with computational methods, the study examines how language use reflects place identity and patterns of language variation and change based on user-informed lexical, morphosyntactic, and semantic variables. The findings show that users generally associate language with place, and place-related communities form a contiguous speech community, though alignment between geographic dialect commun","authors_text":"Sidney Wong","cross_cats":[],"headline":"New Zealand Reddit users link language to place and form contiguous speech communities with complex geographic alignment; Word2Vec embeddings reveal semantic variations and shifts in NZ English on a 4.26 billion word corpus.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-04-17T06:37:25Z","title":"Language, Place, and Social Media: Geographic Dialect Alignment in New Zealand"},"references":{"count":293,"internal_anchors":1,"resolved_work":293,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"Abell, M. and Gordon, E. (1990). This objectionable colonial dialect': historical and contemporary attitudes to New Zealand speech. In Bell, A. and Holmes, J., editors, New Zealand Ways of Speaking En","work_id":"ebec6968-d3cf-471c-accf-adc91a2787ca","year":1990},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":2,"title":"They Had Us In the First Half","work_id":"7fa76632-9013-4064-a647-1b1ec89e36cc","year":2019},{"cited_arxiv_id":"","doi":"10.1080/13645579.2022.2111816","is_internal_anchor":false,"ref_index":3,"title":"Adams, N. N. (2022). ' Scraping ' Reddit posts for academic research? Addressing some blurred lines of consent in growing internet-based research trend during the time of COVID -19. International jour","work_id":"0b537314-5b05-4973-9dee-d1c29660d0d2","year":2022},{"cited_arxiv_id":"","doi":"10.1016/s0271-5309(03)00012-0","is_internal_anchor":false,"ref_index":4,"title":"Agha, A. (2003). The social life of cultural value. Language & Communication , 23(3):231--273. https://doi.org/10.1016/S0271-5309(03)00012-0","work_id":"ba6ccfcb-9509-4762-b465-72795d63f471","year":2003},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"Agnew, J. A. (1987). Place and Politics : The Geographical Mediation of State and Society , volume 1 of Routeledge Library Editions : Political Geography . Routledge, Abingdon, England; New York, NY, ","work_id":"b43a2198-d108-4890-aed3-50ec553b28fe","year":1987}],"snapshot_sha256":"d1bb52de6ee36fc9b2d395fe44b3717415d1fc22138798cea599cfd8dcd94c5d"},"source":{"id":"2604.15744","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-10T08:31:52.274803Z","id":"fb841da6-0bd0-4452-9f8e-f040994d733b","model_set":{"reader":"grok-4.3"},"one_line_summary":"New Zealand Reddit users link language to place and form contiguous speech communities with complex geographic alignment; Word2Vec embeddings reveal semantic variations and shifts in NZ English on a 4.26 billion word corpus.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"","strongest_claim":"Users generally associate language with place, and place-related communities form a contiguous speech community, though alignment between geographic dialect communities and place-related communities remains complex. Advanced language modelling, including static and diachronic Word2Vec language embeddings, revealed semantic variation across place-based communities and meaningful semantic shifts within New Zealand English.","weakest_assumption":"That Reddit communities tied to places accurately represent geographic dialect communities and that user perceptions of language-place links correspond to measurable patterns in actual language use."}},"verdict_id":"fb841da6-0bd0-4452-9f8e-f040994d733b"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8b29d87a3a4beae3c039ef621c7ec7f6748e707acaaa69d0ef63a4abc4f9acb2","target":"record","created_at":"2026-06-03T01:05:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"635fa21eb07200169cfcbca918cb952a64f615ae959c612e6b958ab193bad5da","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-04-17T06:37:25Z","title_canon_sha256":"6896165c79aec3b6bf3217edc533ec69e0acbae99cab7142eeb24adc0af1141f"},"schema_version":"1.0","source":{"id":"2604.15744","kind":"arxiv","version":1}},"canonical_sha256":"ab0c1d06ad490f07f9ecf924580667340efe9aff9dd70bf52134ffdcd27f6162","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ab0c1d06ad490f07f9ecf924580667340efe9aff9dd70bf52134ffdcd27f6162","first_computed_at":"2026-06-03T01:05:13.757647Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-03T01:05:13.757647Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"55K58NFa92xIDFqCRW/KFNSCYw+GClnN17tc16+S95VsXU9ee1nmEFk1nL+ffrR6i/KyVpjyY6l26Ruzpdr7CA==","signature_status":"signed_v1","signed_at":"2026-06-03T01:05:13.758057Z","signed_message":"canonical_sha256_bytes"},"source_id":"2604.15744","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8b29d87a3a4beae3c039ef621c7ec7f6748e707acaaa69d0ef63a4abc4f9acb2","sha256:f37f27254e7e04e955b67433f921ef3fbe6ff7ed9f34212823600c103275eaf0"],"state_sha256":"8eb18a9ba5a6b908f3dc56997750cc8712d3cab8f16d5ac809390b724625e738"}