{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:HZOXB3MUYR6Z535MMI3Q7ZR375","short_pith_number":"pith:HZOXB3MU","canonical_record":{"source":{"id":"2605.23597","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-22T13:06:03Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"70088f2567bdc69e314323253a8d400e30f22ad2cbbf1f1cd4147ecca7ff04ab","abstract_canon_sha256":"88c8121c98634396ac2b4dfcfd19cb3ba4c5ff4bb84027fd90c3b5afe0c2a56f"},"schema_version":"1.0"},"canonical_sha256":"3e5d70ed94c47d9eefac62370fe63bff66b895f47b000d900f0dd404f387e813","source":{"kind":"arxiv","id":"2605.23597","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.23597","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"arxiv_version","alias_value":"2605.23597v1","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.23597","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"pith_short_12","alias_value":"HZOXB3MUYR6Z","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"pith_short_16","alias_value":"HZOXB3MUYR6Z535M","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"pith_short_8","alias_value":"HZOXB3MU","created_at":"2026-05-25T02:02:21Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:HZOXB3MUYR6Z535MMI3Q7ZR375","target":"record","payload":{"canonical_record":{"source":{"id":"2605.23597","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-22T13:06:03Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"70088f2567bdc69e314323253a8d400e30f22ad2cbbf1f1cd4147ecca7ff04ab","abstract_canon_sha256":"88c8121c98634396ac2b4dfcfd19cb3ba4c5ff4bb84027fd90c3b5afe0c2a56f"},"schema_version":"1.0"},"canonical_sha256":"3e5d70ed94c47d9eefac62370fe63bff66b895f47b000d900f0dd404f387e813","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-25T02:02:21.491640Z","signature_b64":"IQjhvAA1jo4nL9qcQ84pN5hh3aT5qqEAO52K4GdmpvXoMep7u+1BwsSzpUBVi6GwOI0kyDr5sbdhFIKPRUJODQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3e5d70ed94c47d9eefac62370fe63bff66b895f47b000d900f0dd404f387e813","last_reissued_at":"2026-05-25T02:02:21.490973Z","signature_status":"signed_v1","first_computed_at":"2026-05-25T02:02:21.490973Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.23597","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-25T02:02:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/vp9aNUng46/A5PvBWwrIuhD157tWjZHQUMDeJKObeKeBOcQjSDKxQS9tpJKcT9fymaY6KTY6Uw82pltt82DCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T09:53:26.583801Z"},"content_sha256":"378dd62693e9261b1276a4f86bb9cc91ff035c3ff4bca99505a3d0fd1c3e096e","schema_version":"1.0","event_id":"sha256:378dd62693e9261b1276a4f86bb9cc91ff035c3ff4bca99505a3d0fd1c3e096e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:HZOXB3MUYR6Z535MMI3Q7ZR375","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Structure-Guided Entity Resolution: Fine-Tuning LLMs for Robust Name Matching in Complex Linguistic Contexts","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Hitesh Kapoor, Nilesh Patil, Shivam Chourasia","submitted_at":"2026-05-22T13:06:03Z","abstract_excerpt":"Matching person names across heterogeneous records is a core challenge in entity resolution, especially within linguistically and culturally complex environments. Variations in naming conventions, inconsistent transliteration across scripts, and frequent data entry errors make it difficult to unify user identities, an essential requirement for Know Your Customer (KYC) compliance. While Large Language Models have shown promise in understanding natural language, they often struggle with the structured ambiguity present in such domain-specific settings. This paper introduces Structure-Guided Enti"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.23597","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.23597/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-25T02:02:21Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kuS7rmN66qLhE+laIyud2ZN/Qa7uXNels8X22cacZmre7nvVuXFWlPhUL1eIXY9OQsVv2SX9VMRabrRS2bnjBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T09:53:26.584491Z"},"content_sha256":"80fff558c0c672098d2c210f876d3f1b30ffd499de31c16f9387a22c93f09397","schema_version":"1.0","event_id":"sha256:80fff558c0c672098d2c210f876d3f1b30ffd499de31c16f9387a22c93f09397"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HZOXB3MUYR6Z535MMI3Q7ZR375/bundle.json","state_url":"https://pith.science/pith/HZOXB3MUYR6Z535MMI3Q7ZR375/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HZOXB3MUYR6Z535MMI3Q7ZR375/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T09:53:26Z","links":{"resolver":"https://pith.science/pith/HZOXB3MUYR6Z535MMI3Q7ZR375","bundle":"https://pith.science/pith/HZOXB3MUYR6Z535MMI3Q7ZR375/bundle.json","state":"https://pith.science/pith/HZOXB3MUYR6Z535MMI3Q7ZR375/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HZOXB3MUYR6Z535MMI3Q7ZR375/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:HZOXB3MUYR6Z535MMI3Q7ZR375","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"88c8121c98634396ac2b4dfcfd19cb3ba4c5ff4bb84027fd90c3b5afe0c2a56f","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-22T13:06:03Z","title_canon_sha256":"70088f2567bdc69e314323253a8d400e30f22ad2cbbf1f1cd4147ecca7ff04ab"},"schema_version":"1.0","source":{"id":"2605.23597","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.23597","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"arxiv_version","alias_value":"2605.23597v1","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.23597","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"pith_short_12","alias_value":"HZOXB3MUYR6Z","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"pith_short_16","alias_value":"HZOXB3MUYR6Z535M","created_at":"2026-05-25T02:02:21Z"},{"alias_kind":"pith_short_8","alias_value":"HZOXB3MU","created_at":"2026-05-25T02:02:21Z"}],"graph_snapshots":[{"event_id":"sha256:80fff558c0c672098d2c210f876d3f1b30ffd499de31c16f9387a22c93f09397","target":"graph","created_at":"2026-05-25T02:02:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.23597/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Matching person names across heterogeneous records is a core challenge in entity resolution, especially within linguistically and culturally complex environments. Variations in naming conventions, inconsistent transliteration across scripts, and frequent data entry errors make it difficult to unify user identities, an essential requirement for Know Your Customer (KYC) compliance. While Large Language Models have shown promise in understanding natural language, they often struggle with the structured ambiguity present in such domain-specific settings. This paper introduces Structure-Guided Enti","authors_text":"Hitesh Kapoor, Nilesh Patil, Shivam Chourasia","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-22T13:06:03Z","title":"Structure-Guided Entity Resolution: Fine-Tuning LLMs for Robust Name Matching in Complex Linguistic Contexts"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.23597","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:378dd62693e9261b1276a4f86bb9cc91ff035c3ff4bca99505a3d0fd1c3e096e","target":"record","created_at":"2026-05-25T02:02:21Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"88c8121c98634396ac2b4dfcfd19cb3ba4c5ff4bb84027fd90c3b5afe0c2a56f","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-22T13:06:03Z","title_canon_sha256":"70088f2567bdc69e314323253a8d400e30f22ad2cbbf1f1cd4147ecca7ff04ab"},"schema_version":"1.0","source":{"id":"2605.23597","kind":"arxiv","version":1}},"canonical_sha256":"3e5d70ed94c47d9eefac62370fe63bff66b895f47b000d900f0dd404f387e813","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"3e5d70ed94c47d9eefac62370fe63bff66b895f47b000d900f0dd404f387e813","first_computed_at":"2026-05-25T02:02:21.490973Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-25T02:02:21.490973Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"IQjhvAA1jo4nL9qcQ84pN5hh3aT5qqEAO52K4GdmpvXoMep7u+1BwsSzpUBVi6GwOI0kyDr5sbdhFIKPRUJODQ==","signature_status":"signed_v1","signed_at":"2026-05-25T02:02:21.491640Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.23597","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:378dd62693e9261b1276a4f86bb9cc91ff035c3ff4bca99505a3d0fd1c3e096e","sha256:80fff558c0c672098d2c210f876d3f1b30ffd499de31c16f9387a22c93f09397"],"state_sha256":"c803607d0ed7ab90adc3a558d52c43807ea021c34e871f6074fdc1317ca1b7ea"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+tsIA9UvFAGnkXyT5MUnufuskpLCAffuWPaShEE4c6nCVjarRmMilwBAmCV9j4yUkcgndcM39oIYGGulYoUUDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T09:53:26.588447Z","bundle_sha256":"0bc6af3248228086fd1f5b19136af8c69f121510e40b4a8ad51bfaa85689ddbb"}}