{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:CVW24JX5HS26CRZWSL7ODQMQLY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9045fc19522ed5a7c2b3c6985eda018da97cfd841a88176b50b7fe0e0fc8e169","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-18T07:00:43Z","title_canon_sha256":"89951779045104667e545f897388fa0945f9a19f784871e8737f3c999f43785e"},"schema_version":"1.0","source":{"id":"2606.19852","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.19852","created_at":"2026-06-19T16:12:37Z"},{"alias_kind":"arxiv_version","alias_value":"2606.19852v1","created_at":"2026-06-19T16:12:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.19852","created_at":"2026-06-19T16:12:37Z"},{"alias_kind":"pith_short_12","alias_value":"CVW24JX5HS26","created_at":"2026-06-19T16:12:37Z"},{"alias_kind":"pith_short_16","alias_value":"CVW24JX5HS26CRZW","created_at":"2026-06-19T16:12:37Z"},{"alias_kind":"pith_short_8","alias_value":"CVW24JX5","created_at":"2026-06-19T16:12:37Z"}],"graph_snapshots":[{"event_id":"sha256:433ed4f6746ab829c7a646f5259a6bab870f35b3fdd3526055c3a5e539adbd1a","target":"graph","created_at":"2026-06-19T16:12:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.19852/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Information extraction from pathology reports is essential for cancer staging, tumor registry population. Yet key data remains embedded in narrative reports, making manual extraction labor-intensive and error-prone. Traditional supervised Natural Language Processing pipelines address this through fully supervised Named Entity Recognition and Relation Extraction, but require expensive manual annotation and suffer cascading failures when upstream entities are missed. In this study, we developed a zero-shot, agentic workflow, and evaluated five open-source generative Large Language Models (LLMs) ","authors_text":"Aman Pathak (1), Aokun Chen (3), Cheng Peng (1), Hiren Mehta (2), Mengxian Lyu (1), Reema Solan (1), Sankalp Talankar (1), Yasir Khan (1), Yi Guo (1), Yonghui Wu (1), Ziyi Chen (1)","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-18T07:00:43Z","title":"Prompt, Plan, Extract: Zero-Shot Agentic LLMs Workflows for Lung Pathology Extraction from Clinical Narratives"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.19852","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3d18eedce6d5e338d10c5549205b34cd90a1727bec0c0c979629c030d404bdcb","target":"record","created_at":"2026-06-19T16:12:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9045fc19522ed5a7c2b3c6985eda018da97cfd841a88176b50b7fe0e0fc8e169","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-18T07:00:43Z","title_canon_sha256":"89951779045104667e545f897388fa0945f9a19f784871e8737f3c999f43785e"},"schema_version":"1.0","source":{"id":"2606.19852","kind":"arxiv","version":1}},"canonical_sha256":"156dae26fd3cb5e1473692fee1c1905e1fb0ee7e1cd5a48223cecddbe6791357","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"156dae26fd3cb5e1473692fee1c1905e1fb0ee7e1cd5a48223cecddbe6791357","first_computed_at":"2026-06-19T16:12:37.010284Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:12:37.010284Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"DEF8/Xq1wUmfqGa3xDNRKOQuG/dHKrMMAnypwWv+wUzr1CDFkO9MLmZxbvwjN2ta1s8fChPC8Gsb9Pki7i0pCw==","signature_status":"signed_v1","signed_at":"2026-06-19T16:12:37.010702Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.19852","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3d18eedce6d5e338d10c5549205b34cd90a1727bec0c0c979629c030d404bdcb","sha256:433ed4f6746ab829c7a646f5259a6bab870f35b3fdd3526055c3a5e539adbd1a"],"state_sha256":"203cbfab6ad10b9b0b0fe750180dc3622793705ab94063d2b6f413e93a3fbaef"}