{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5UG6KD2ETUQYCL6DKMHBLJERYG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e8f68bf699a164480375b7f69b50be64064af87a20f7fffaa6e3fe91422fb83e","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-18T14:56:44Z","title_canon_sha256":"857652be774a5522dbb38414dd9efe1e940815234b1778f356620b58e2c65ff4"},"schema_version":"1.0","source":{"id":"2605.18504","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18504","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18504v1","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18504","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_12","alias_value":"5UG6KD2ETUQY","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_16","alias_value":"5UG6KD2ETUQYCL6D","created_at":"2026-05-20T00:06:04Z"},{"alias_kind":"pith_short_8","alias_value":"5UG6KD2E","created_at":"2026-05-20T00:06:04Z"}],"graph_snapshots":[{"event_id":"sha256:c3614ab10df0956701bc64035af067903ccabf8b0030da07af3879145ccd744d","target":"graph","created_at":"2026-05-20T00:06:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.18504/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Machine Translation (MT) for Ancient Greek (AG) to Modern Greek (MG) is a low-resource task, constrained by the lack of large-scale, high-quality parallel data. We address this gap by introducing the AG-MG Parallel Corpus, a new resource containing 132,481 sentence-aligned pairs derived from literary, historical, and biblical texts. We present a novel corpus creation pipeline that combines web-scraped, excerpt-level data with a multi-stage sentence-level alignment, and refinement process. Our method uses VecAlign with LaBSE embeddings, which we first fine-tune on a manually-aligned AG-MG subse","authors_text":"Maria Giagkou, Prokopis Prokopidis, Sokratis Sofianopoulos, Spyridon Mavromatis","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-18T14:56:44Z","title":"Ancient Greek to Modern Greek Machine Translation: A Novel Benchmark and Fine-Tuning Experiments on LLMs and NMT Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18504","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:82332da3be2e66fa47ea1d57f73ae111bcc71018cbba94a88c8d23d221ada18e","target":"record","created_at":"2026-05-20T00:06:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e8f68bf699a164480375b7f69b50be64064af87a20f7fffaa6e3fe91422fb83e","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-18T14:56:44Z","title_canon_sha256":"857652be774a5522dbb38414dd9efe1e940815234b1778f356620b58e2c65ff4"},"schema_version":"1.0","source":{"id":"2605.18504","kind":"arxiv","version":1}},"canonical_sha256":"ed0de50f449d21812fc3530e15a491c1bed15b823a818afbbc61d3a17f9be9f9","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ed0de50f449d21812fc3530e15a491c1bed15b823a818afbbc61d3a17f9be9f9","first_computed_at":"2026-05-20T00:06:04.612740Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:06:04.612740Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"6xbAThW1UVtHl3FRRJQwz+c+U8vjRPAdVTWzP59HbRgVeKzs79R3ayA+dRVTMP9st7GJ8k7pa/GQSU2SKj2NCg==","signature_status":"signed_v1","signed_at":"2026-05-20T00:06:04.613556Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.18504","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:82332da3be2e66fa47ea1d57f73ae111bcc71018cbba94a88c8d23d221ada18e","sha256:c3614ab10df0956701bc64035af067903ccabf8b0030da07af3879145ccd744d"],"state_sha256":"1cc00eca1425b3f3c8862aa4f8e21a8a12ef2bae7d92636025e7d49270796d87"}