{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:OZR7OKD3M25FPI2CNR6RUBQHXZ","short_pith_number":"pith:OZR7OKD3","canonical_record":{"source":{"id":"1801.06436","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2018-01-19T15:00:33Z","cross_cats_sorted":[],"title_canon_sha256":"7fa985e7195f7d279f2e68cea5ce622a62b95e14b4e124ea106046a13587d64b","abstract_canon_sha256":"cda7a3b370b17fe2bbf9ae58521c67580b0fe32802d47efebdefc9afacc5d82d"},"schema_version":"1.0"},"canonical_sha256":"7663f7287b66ba57a3426c7d1a0607be7c2d67433051745eb020ab63e85a462b","source":{"kind":"arxiv","id":"1801.06436","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1801.06436","created_at":"2026-05-18T00:25:30Z"},{"alias_kind":"arxiv_version","alias_value":"1801.06436v1","created_at":"2026-05-18T00:25:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.06436","created_at":"2026-05-18T00:25:30Z"},{"alias_kind":"pith_short_12","alias_value":"OZR7OKD3M25F","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_16","alias_value":"OZR7OKD3M25FPI2C","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_8","alias_value":"OZR7OKD3","created_at":"2026-05-18T12:32:43Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:OZR7OKD3M25FPI2CNR6RUBQHXZ","target":"record","payload":{"canonical_record":{"source":{"id":"1801.06436","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2018-01-19T15:00:33Z","cross_cats_sorted":[],"title_canon_sha256":"7fa985e7195f7d279f2e68cea5ce622a62b95e14b4e124ea106046a13587d64b","abstract_canon_sha256":"cda7a3b370b17fe2bbf9ae58521c67580b0fe32802d47efebdefc9afacc5d82d"},"schema_version":"1.0"},"canonical_sha256":"7663f7287b66ba57a3426c7d1a0607be7c2d67433051745eb020ab63e85a462b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:25:30.136250Z","signature_b64":"lPPrgiem/vP01tb3zZY9tphwVBs3d1xSIClF9huCUiMn7akPCPv5fOjhGomOexkKLwsJcH6xa8yzXIvjRQsqBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7663f7287b66ba57a3426c7d1a0607be7c2d67433051745eb020ab63e85a462b","last_reissued_at":"2026-05-18T00:25:30.135504Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:25:30.135504Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1801.06436","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:25:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vHobbMwdspppi2ehrtzyq8pk3qtkeyo0A/ISPuTiKeJRUPcGUqv2LC+lYWiEJw7Rjriz3W2LcEqPjPRjUSGwBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T08:36:36.879216Z"},"content_sha256":"d96375507d7abd85fb2af374a38dd50d18b182e63cd40c224bb0972377c22b34","schema_version":"1.0","event_id":"sha256:d96375507d7abd85fb2af374a38dd50d18b182e63cd40c224bb0972377c22b34"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:OZR7OKD3M25FPI2CNR6RUBQHXZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Resource-Light Method for Cross-Lingual Semantic Textual Similarity","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Goran Glava\\v{s}, Marc Franco-Salvador, Paolo Rosso, Simone Paolo Ponzetto","submitted_at":"2018-01-19T15:00:33Z","abstract_excerpt":"Recognizing semantically similar sentences or paragraphs across languages is beneficial for many tasks, ranging from cross-lingual information retrieval and plagiarism detection to machine translation. Recently proposed methods for predicting cross-lingual semantic similarity of short texts, however, make use of tools and resources (e.g., machine translation systems, syntactic parsers or named entity recognition) that for many languages (or language pairs) do not exist. In contrast, we propose an unsupervised and a very resource-light approach for measuring semantic similarity between texts in"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.06436","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:25:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5H07ENPNaOywNNXXoLmA74K4aePfEZJn79MCF7ofe0o48+MNOICWBED7mOhw3t9GXrOemtYzoYJGRpa514T7AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T08:36:36.879578Z"},"content_sha256":"a9e935e8070a49ff3bf1a0f158132858e688737c6eb326c818f420db5aabb63e","schema_version":"1.0","event_id":"sha256:a9e935e8070a49ff3bf1a0f158132858e688737c6eb326c818f420db5aabb63e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/OZR7OKD3M25FPI2CNR6RUBQHXZ/bundle.json","state_url":"https://pith.science/pith/OZR7OKD3M25FPI2CNR6RUBQHXZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/OZR7OKD3M25FPI2CNR6RUBQHXZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T08:36:36Z","links":{"resolver":"https://pith.science/pith/OZR7OKD3M25FPI2CNR6RUBQHXZ","bundle":"https://pith.science/pith/OZR7OKD3M25FPI2CNR6RUBQHXZ/bundle.json","state":"https://pith.science/pith/OZR7OKD3M25FPI2CNR6RUBQHXZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/OZR7OKD3M25FPI2CNR6RUBQHXZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:OZR7OKD3M25FPI2CNR6RUBQHXZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"cda7a3b370b17fe2bbf9ae58521c67580b0fe32802d47efebdefc9afacc5d82d","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2018-01-19T15:00:33Z","title_canon_sha256":"7fa985e7195f7d279f2e68cea5ce622a62b95e14b4e124ea106046a13587d64b"},"schema_version":"1.0","source":{"id":"1801.06436","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1801.06436","created_at":"2026-05-18T00:25:30Z"},{"alias_kind":"arxiv_version","alias_value":"1801.06436v1","created_at":"2026-05-18T00:25:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.06436","created_at":"2026-05-18T00:25:30Z"},{"alias_kind":"pith_short_12","alias_value":"OZR7OKD3M25F","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_16","alias_value":"OZR7OKD3M25FPI2C","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_8","alias_value":"OZR7OKD3","created_at":"2026-05-18T12:32:43Z"}],"graph_snapshots":[{"event_id":"sha256:a9e935e8070a49ff3bf1a0f158132858e688737c6eb326c818f420db5aabb63e","target":"graph","created_at":"2026-05-18T00:25:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Recognizing semantically similar sentences or paragraphs across languages is beneficial for many tasks, ranging from cross-lingual information retrieval and plagiarism detection to machine translation. Recently proposed methods for predicting cross-lingual semantic similarity of short texts, however, make use of tools and resources (e.g., machine translation systems, syntactic parsers or named entity recognition) that for many languages (or language pairs) do not exist. In contrast, we propose an unsupervised and a very resource-light approach for measuring semantic similarity between texts in","authors_text":"Goran Glava\\v{s}, Marc Franco-Salvador, Paolo Rosso, Simone Paolo Ponzetto","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2018-01-19T15:00:33Z","title":"A Resource-Light Method for Cross-Lingual Semantic Textual Similarity"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.06436","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d96375507d7abd85fb2af374a38dd50d18b182e63cd40c224bb0972377c22b34","target":"record","created_at":"2026-05-18T00:25:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"cda7a3b370b17fe2bbf9ae58521c67580b0fe32802d47efebdefc9afacc5d82d","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2018-01-19T15:00:33Z","title_canon_sha256":"7fa985e7195f7d279f2e68cea5ce622a62b95e14b4e124ea106046a13587d64b"},"schema_version":"1.0","source":{"id":"1801.06436","kind":"arxiv","version":1}},"canonical_sha256":"7663f7287b66ba57a3426c7d1a0607be7c2d67433051745eb020ab63e85a462b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7663f7287b66ba57a3426c7d1a0607be7c2d67433051745eb020ab63e85a462b","first_computed_at":"2026-05-18T00:25:30.135504Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:25:30.135504Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"lPPrgiem/vP01tb3zZY9tphwVBs3d1xSIClF9huCUiMn7akPCPv5fOjhGomOexkKLwsJcH6xa8yzXIvjRQsqBA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:25:30.136250Z","signed_message":"canonical_sha256_bytes"},"source_id":"1801.06436","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d96375507d7abd85fb2af374a38dd50d18b182e63cd40c224bb0972377c22b34","sha256:a9e935e8070a49ff3bf1a0f158132858e688737c6eb326c818f420db5aabb63e"],"state_sha256":"5b52296071a9295d58efc05ce1c59233e9428b83bcd3b09d82ef42cd5d78fe77"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jGedFJokF9rKNCwPe2ZKn3zrvA04H/EFriirDancXAKgSx8DVxR8kHvoNuHh7Tdlb442qsg5S2b4qozC1V5WAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T08:36:36.881530Z","bundle_sha256":"a9e1fbf2f07d0490a2020542fc43ccf4de4ad024bf89e70c06d3c18e51949dac"}}