{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:BTSNPFZFJDITC2DNYVTYAITCVU","short_pith_number":"pith:BTSNPFZF","canonical_record":{"source":{"id":"1811.07497","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-19T04:42:54Z","cross_cats_sorted":[],"title_canon_sha256":"75325cf9601da9c75946282f349b650273ee353ab9de49fe68d280ed70e5ecc3","abstract_canon_sha256":"bf444740ff5c1cc1a4254c949059d6322fb5b80108d4a3bf65ffc099563c488b"},"schema_version":"1.0"},"canonical_sha256":"0ce4d7972548d131686dc567802262ad35c799b449e826b54755bc00eb43215a","source":{"kind":"arxiv","id":"1811.07497","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.07497","created_at":"2026-05-18T00:00:24Z"},{"alias_kind":"arxiv_version","alias_value":"1811.07497v1","created_at":"2026-05-18T00:00:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.07497","created_at":"2026-05-18T00:00:24Z"},{"alias_kind":"pith_short_12","alias_value":"BTSNPFZFJDIT","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_16","alias_value":"BTSNPFZFJDITC2DN","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_8","alias_value":"BTSNPFZF","created_at":"2026-05-18T12:32:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:BTSNPFZFJDITC2DNYVTYAITCVU","target":"record","payload":{"canonical_record":{"source":{"id":"1811.07497","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-19T04:42:54Z","cross_cats_sorted":[],"title_canon_sha256":"75325cf9601da9c75946282f349b650273ee353ab9de49fe68d280ed70e5ecc3","abstract_canon_sha256":"bf444740ff5c1cc1a4254c949059d6322fb5b80108d4a3bf65ffc099563c488b"},"schema_version":"1.0"},"canonical_sha256":"0ce4d7972548d131686dc567802262ad35c799b449e826b54755bc00eb43215a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:00:24.319761Z","signature_b64":"2BvJeqJKz353l5NjvYgxlpQb0A5hGTrifKOmRoSD4odPRANIl2zwJ6dPyGQ2Z5aKrnDAeCSTzhFotNP212DFCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0ce4d7972548d131686dc567802262ad35c799b449e826b54755bc00eb43215a","last_reissued_at":"2026-05-18T00:00:24.319054Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:00:24.319054Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1811.07497","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:00:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6wLL+Cis9tyQLx5mNDR+oiErgx7UFO2yeWhAcVe2Qh0BJ++rs5MzsTlqARnE5WhW3v4hK4W1NO3NCICXZhtwDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T15:03:07.526031Z"},"content_sha256":"78a9da31213f04d33f76ae36dcc2b5f1fb822b2152f471100b59bf8f26b0a2ac","schema_version":"1.0","event_id":"sha256:78a9da31213f04d33f76ae36dcc2b5f1fb822b2152f471100b59bf8f26b0a2ac"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:BTSNPFZFJDITC2DNYVTYAITCVU","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Comparative Analysis of Content-based Geolocation in Blogs and Tweets","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Konstantinos Pappas, Mahmoud Azab, Rada Mihalcea","submitted_at":"2018-11-19T04:42:54Z","abstract_excerpt":"The geolocation of online information is an essential component in any geospatial application. While most of the previous work on geolocation has focused on Twitter, in this paper we quantify and compare the performance of text-based geolocation methods on social media data drawn from both Blogger and Twitter. We introduce a novel set of location specific features that are both highly informative and easily interpretable, and show that we can achieve error rate reductions of up to 12.5% with respect to the best previously proposed geolocation features. We also show that despite posting longer "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.07497","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:00:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"U0HIXSdWSnC8tP6RqfVFr3hfZLH5H6+PgmUJUCc8ZSdysQyt7Fr2eZNfnDCYeeLHWpalQtXXZzRA02MyL8j2BA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T15:03:07.526387Z"},"content_sha256":"47587b74e3349464c5da52d61c77581c1445db94d92eefda40e816b5ab6dfbb6","schema_version":"1.0","event_id":"sha256:47587b74e3349464c5da52d61c77581c1445db94d92eefda40e816b5ab6dfbb6"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/BTSNPFZFJDITC2DNYVTYAITCVU/bundle.json","state_url":"https://pith.science/pith/BTSNPFZFJDITC2DNYVTYAITCVU/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/BTSNPFZFJDITC2DNYVTYAITCVU/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T15:03:07Z","links":{"resolver":"https://pith.science/pith/BTSNPFZFJDITC2DNYVTYAITCVU","bundle":"https://pith.science/pith/BTSNPFZFJDITC2DNYVTYAITCVU/bundle.json","state":"https://pith.science/pith/BTSNPFZFJDITC2DNYVTYAITCVU/state.json","well_known_bundle":"https://pith.science/.well-known/pith/BTSNPFZFJDITC2DNYVTYAITCVU/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:BTSNPFZFJDITC2DNYVTYAITCVU","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"bf444740ff5c1cc1a4254c949059d6322fb5b80108d4a3bf65ffc099563c488b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-19T04:42:54Z","title_canon_sha256":"75325cf9601da9c75946282f349b650273ee353ab9de49fe68d280ed70e5ecc3"},"schema_version":"1.0","source":{"id":"1811.07497","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.07497","created_at":"2026-05-18T00:00:24Z"},{"alias_kind":"arxiv_version","alias_value":"1811.07497v1","created_at":"2026-05-18T00:00:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.07497","created_at":"2026-05-18T00:00:24Z"},{"alias_kind":"pith_short_12","alias_value":"BTSNPFZFJDIT","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_16","alias_value":"BTSNPFZFJDITC2DN","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_8","alias_value":"BTSNPFZF","created_at":"2026-05-18T12:32:16Z"}],"graph_snapshots":[{"event_id":"sha256:47587b74e3349464c5da52d61c77581c1445db94d92eefda40e816b5ab6dfbb6","target":"graph","created_at":"2026-05-18T00:00:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The geolocation of online information is an essential component in any geospatial application. While most of the previous work on geolocation has focused on Twitter, in this paper we quantify and compare the performance of text-based geolocation methods on social media data drawn from both Blogger and Twitter. We introduce a novel set of location specific features that are both highly informative and easily interpretable, and show that we can achieve error rate reductions of up to 12.5% with respect to the best previously proposed geolocation features. We also show that despite posting longer ","authors_text":"Konstantinos Pappas, Mahmoud Azab, Rada Mihalcea","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-19T04:42:54Z","title":"A Comparative Analysis of Content-based Geolocation in Blogs and Tweets"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.07497","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:78a9da31213f04d33f76ae36dcc2b5f1fb822b2152f471100b59bf8f26b0a2ac","target":"record","created_at":"2026-05-18T00:00:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"bf444740ff5c1cc1a4254c949059d6322fb5b80108d4a3bf65ffc099563c488b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-19T04:42:54Z","title_canon_sha256":"75325cf9601da9c75946282f349b650273ee353ab9de49fe68d280ed70e5ecc3"},"schema_version":"1.0","source":{"id":"1811.07497","kind":"arxiv","version":1}},"canonical_sha256":"0ce4d7972548d131686dc567802262ad35c799b449e826b54755bc00eb43215a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0ce4d7972548d131686dc567802262ad35c799b449e826b54755bc00eb43215a","first_computed_at":"2026-05-18T00:00:24.319054Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:00:24.319054Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"2BvJeqJKz353l5NjvYgxlpQb0A5hGTrifKOmRoSD4odPRANIl2zwJ6dPyGQ2Z5aKrnDAeCSTzhFotNP212DFCA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:00:24.319761Z","signed_message":"canonical_sha256_bytes"},"source_id":"1811.07497","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:78a9da31213f04d33f76ae36dcc2b5f1fb822b2152f471100b59bf8f26b0a2ac","sha256:47587b74e3349464c5da52d61c77581c1445db94d92eefda40e816b5ab6dfbb6"],"state_sha256":"ffa893ca72d23846595564f50363066afa9176b54b8ffc5a97cc7b777db0337f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UdudqIh6Mzg+0fQGfBF8B0ogOwA1WPelRxB5PUnsk3zKImbV6bE+YmgwQciNEEaK1hOobVNZnLv0U3fOi67vBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T15:03:07.528389Z","bundle_sha256":"16abb9b26df21d0c0c6219636ed06410c7a3fb4ea730d1e34632114d3159e4ce"}}