{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:4CBROHNK6RQQIJEI63HEA7EZ2E","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b72378bfac67d8952b365c5a50564d37715dd0204f60e78a5cabf2d1476905be","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T12:17:35Z","title_canon_sha256":"67488d9ccafc938559878884f2538761eb361f322af4bad5d7773d6df2a6dcb3"},"schema_version":"1.0","source":{"id":"2606.30201","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.30201","created_at":"2026-06-30T02:17:53Z"},{"alias_kind":"arxiv_version","alias_value":"2606.30201v1","created_at":"2026-06-30T02:17:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.30201","created_at":"2026-06-30T02:17:53Z"},{"alias_kind":"pith_short_12","alias_value":"4CBROHNK6RQQ","created_at":"2026-06-30T02:17:53Z"},{"alias_kind":"pith_short_16","alias_value":"4CBROHNK6RQQIJEI","created_at":"2026-06-30T02:17:53Z"},{"alias_kind":"pith_short_8","alias_value":"4CBROHNK","created_at":"2026-06-30T02:17:53Z"}],"graph_snapshots":[{"event_id":"sha256:970ee0e81042e67976fc731e075a2f917c38a959d59cc0e7e47bc797b8786caa","target":"graph","created_at":"2026-06-30T02:17:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.30201/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Current evaluation protocols for Vision-Language Models (VLMs) in Radiology Report Generation (RRG) rely on report-level metrics that measure lexical overlap or aggregate clinical correctness. However, such metrics do not test whether individual diagnostic statements stem from the actual pathological evidence visible in the image. This allows models to achieve competitive scores by exploiting learned priors or spurious correlations, a failure mode we refer to as vision shortcut. We introduce SHOVIR, a benchmark for evaluating vision shortcut behavior in RRG. SHOVIR extends two spatially annota","authors_text":"Filippo Ruffini, Marco Salm\\'e, Paolo Soda, Rosa Sicilia, Valerio Guarrasi","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T12:17:35Z","title":"SHOVIR: A Benchmark for Evaluating Vision Shortcut Learning in Radiology Report Generation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.30201","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ad934135d38dfb1c7b8101925a2974b03f4ebaa47253473d115ce7867d2626f9","target":"record","created_at":"2026-06-30T02:17:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b72378bfac67d8952b365c5a50564d37715dd0204f60e78a5cabf2d1476905be","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T12:17:35Z","title_canon_sha256":"67488d9ccafc938559878884f2538761eb361f322af4bad5d7773d6df2a6dcb3"},"schema_version":"1.0","source":{"id":"2606.30201","kind":"arxiv","version":1}},"canonical_sha256":"e083171daaf461042488f6ce407c99d11f7be58b67972539379cb52c2b807cec","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e083171daaf461042488f6ce407c99d11f7be58b67972539379cb52c2b807cec","first_computed_at":"2026-06-30T02:17:53.820622Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-30T02:17:53.820622Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"nvLP35LScCy0D4+m8CgmkGe22l0Y7AIybEh+V1p3W7CqJd+jkJ5RmSkwdks6gcU+erAOvRPsp46q5lf4CnaCBA==","signature_status":"signed_v1","signed_at":"2026-06-30T02:17:53.821080Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.30201","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ad934135d38dfb1c7b8101925a2974b03f4ebaa47253473d115ce7867d2626f9","sha256:970ee0e81042e67976fc731e075a2f917c38a959d59cc0e7e47bc797b8786caa"],"state_sha256":"ce3c241e484fed962b79e5bbd9695a3c29560aa96c133e8aa99e13b875e964ac"}