{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:AVTTBS5CY7DSGCSQO3XUMO3XFI","short_pith_number":"pith:AVTTBS5C","canonical_record":{"source":{"id":"1907.04492","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-07-10T02:43:37Z","cross_cats_sorted":[],"title_canon_sha256":"302faea4e3fd580ede57cb109777bf11998688dad4e8c26ffd0832c7ed2c1558","abstract_canon_sha256":"fbee1f46f0abbf0f9a09e099141e8327866e29a0e41b3ef14a9b60ac09c76918"},"schema_version":"1.0"},"canonical_sha256":"056730cba2c7c7230a5076ef463b772a1d05eb9b0e3355cf15a92f2d8ba5c71d","source":{"kind":"arxiv","id":"1907.04492","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.04492","created_at":"2026-05-17T23:41:00Z"},{"alias_kind":"arxiv_version","alias_value":"1907.04492v1","created_at":"2026-05-17T23:41:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.04492","created_at":"2026-05-17T23:41:00Z"},{"alias_kind":"pith_short_12","alias_value":"AVTTBS5CY7DS","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_16","alias_value":"AVTTBS5CY7DSGCSQ","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_8","alias_value":"AVTTBS5C","created_at":"2026-05-18T12:33:12Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:AVTTBS5CY7DSGCSQO3XUMO3XFI","target":"record","payload":{"canonical_record":{"source":{"id":"1907.04492","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-07-10T02:43:37Z","cross_cats_sorted":[],"title_canon_sha256":"302faea4e3fd580ede57cb109777bf11998688dad4e8c26ffd0832c7ed2c1558","abstract_canon_sha256":"fbee1f46f0abbf0f9a09e099141e8327866e29a0e41b3ef14a9b60ac09c76918"},"schema_version":"1.0"},"canonical_sha256":"056730cba2c7c7230a5076ef463b772a1d05eb9b0e3355cf15a92f2d8ba5c71d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:00.110235Z","signature_b64":"P2GJQRJmtLm61sogPFn5cI25QHWjJETayZky+3JRdjniuMnL4RvpLGN5YJZzDRycaydCJrUKw9N/lFE2+p2wBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"056730cba2c7c7230a5076ef463b772a1d05eb9b0e3355cf15a92f2d8ba5c71d","last_reissued_at":"2026-05-17T23:41:00.109594Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:00.109594Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1907.04492","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"V0ORTt/inTWwQaeGXXI40xLRp6ww65iZahI0cVjkY+haoFuywSoRk//GXS75ZP89ggEL2lEqCh/aiRcJyqcoDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T18:31:27.518173Z"},"content_sha256":"ae448f7809731955167ed42cade78e76e1cd023d71fc80693aa09d5a25bd9e70","schema_version":"1.0","event_id":"sha256:ae448f7809731955167ed42cade78e76e1cd023d71fc80693aa09d5a25bd9e70"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:AVTTBS5CY7DSGCSQO3XUMO3XFI","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Exploiting user-frequency information for mining regionalisms from Social Media texts","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Agust\\'in Gravano, Dami\\'an E. Aleman, Juan Manuel P\\'erez, Santiago N. Kalinowski","submitted_at":"2019-07-10T02:43:37Z","abstract_excerpt":"The task of detecting regionalisms (expressions or words used in certain regions) has traditionally relied on the use of questionnaires and surveys, and has also heavily depended on the expertise and intuition of the surveyor. The irruption of Social Media and its microblogging services has produced an unprecedented wealth of content, mainly informal text generated by users, opening new opportunities for linguists to extend their studies of language variation. Previous work on automatic detection of regionalisms depended mostly on word frequencies. In this work, we present a novel metric based"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.04492","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cY8M/LS1D5Dm+fdw80M5+GsHONOyYubqZKduNBVqJlB4fHSNt2wJs+osZJ/+6W9Iu7pmkbGVHMAvUe4w93S9CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T18:31:27.518910Z"},"content_sha256":"04704d0a70c9e0403627844b5f62671932d464edd835fb643a36de292bd7648a","schema_version":"1.0","event_id":"sha256:04704d0a70c9e0403627844b5f62671932d464edd835fb643a36de292bd7648a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/AVTTBS5CY7DSGCSQO3XUMO3XFI/bundle.json","state_url":"https://pith.science/pith/AVTTBS5CY7DSGCSQO3XUMO3XFI/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/AVTTBS5CY7DSGCSQO3XUMO3XFI/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T18:31:27Z","links":{"resolver":"https://pith.science/pith/AVTTBS5CY7DSGCSQO3XUMO3XFI","bundle":"https://pith.science/pith/AVTTBS5CY7DSGCSQO3XUMO3XFI/bundle.json","state":"https://pith.science/pith/AVTTBS5CY7DSGCSQO3XUMO3XFI/state.json","well_known_bundle":"https://pith.science/.well-known/pith/AVTTBS5CY7DSGCSQO3XUMO3XFI/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:AVTTBS5CY7DSGCSQO3XUMO3XFI","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fbee1f46f0abbf0f9a09e099141e8327866e29a0e41b3ef14a9b60ac09c76918","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-07-10T02:43:37Z","title_canon_sha256":"302faea4e3fd580ede57cb109777bf11998688dad4e8c26ffd0832c7ed2c1558"},"schema_version":"1.0","source":{"id":"1907.04492","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.04492","created_at":"2026-05-17T23:41:00Z"},{"alias_kind":"arxiv_version","alias_value":"1907.04492v1","created_at":"2026-05-17T23:41:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.04492","created_at":"2026-05-17T23:41:00Z"},{"alias_kind":"pith_short_12","alias_value":"AVTTBS5CY7DS","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_16","alias_value":"AVTTBS5CY7DSGCSQ","created_at":"2026-05-18T12:33:12Z"},{"alias_kind":"pith_short_8","alias_value":"AVTTBS5C","created_at":"2026-05-18T12:33:12Z"}],"graph_snapshots":[{"event_id":"sha256:04704d0a70c9e0403627844b5f62671932d464edd835fb643a36de292bd7648a","target":"graph","created_at":"2026-05-17T23:41:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The task of detecting regionalisms (expressions or words used in certain regions) has traditionally relied on the use of questionnaires and surveys, and has also heavily depended on the expertise and intuition of the surveyor. The irruption of Social Media and its microblogging services has produced an unprecedented wealth of content, mainly informal text generated by users, opening new opportunities for linguists to extend their studies of language variation. Previous work on automatic detection of regionalisms depended mostly on word frequencies. In this work, we present a novel metric based","authors_text":"Agust\\'in Gravano, Dami\\'an E. Aleman, Juan Manuel P\\'erez, Santiago N. Kalinowski","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-07-10T02:43:37Z","title":"Exploiting user-frequency information for mining regionalisms from Social Media texts"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.04492","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ae448f7809731955167ed42cade78e76e1cd023d71fc80693aa09d5a25bd9e70","target":"record","created_at":"2026-05-17T23:41:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fbee1f46f0abbf0f9a09e099141e8327866e29a0e41b3ef14a9b60ac09c76918","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2019-07-10T02:43:37Z","title_canon_sha256":"302faea4e3fd580ede57cb109777bf11998688dad4e8c26ffd0832c7ed2c1558"},"schema_version":"1.0","source":{"id":"1907.04492","kind":"arxiv","version":1}},"canonical_sha256":"056730cba2c7c7230a5076ef463b772a1d05eb9b0e3355cf15a92f2d8ba5c71d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"056730cba2c7c7230a5076ef463b772a1d05eb9b0e3355cf15a92f2d8ba5c71d","first_computed_at":"2026-05-17T23:41:00.109594Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:00.109594Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"P2GJQRJmtLm61sogPFn5cI25QHWjJETayZky+3JRdjniuMnL4RvpLGN5YJZzDRycaydCJrUKw9N/lFE2+p2wBw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:00.110235Z","signed_message":"canonical_sha256_bytes"},"source_id":"1907.04492","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ae448f7809731955167ed42cade78e76e1cd023d71fc80693aa09d5a25bd9e70","sha256:04704d0a70c9e0403627844b5f62671932d464edd835fb643a36de292bd7648a"],"state_sha256":"4db7fc4ba454b41c2b87214f6358ab5d615553a60a2dbbc01c28f705fe32769a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vMH0TJu3+8qQ9TgK7h5MPQCxq/YzWMtcfPdWhsdFPd6OKHOWcWwuYGBe3DeyA49CaLuoa1RU6UwkTtVqaGZxCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T18:31:27.523480Z","bundle_sha256":"014af3ece120471f8e6c4a46c94544c51e6c30df813ca4aa68ab80d9f9a2dbbd"}}