{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5MKU6T5SNJBYAMSVRBAGKUM5HY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"2015ac8c379c2d03520bf8798beca82135ea225f07501588e5fd129dbf9e5023","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-01-20T00:06:58Z","title_canon_sha256":"329f9f71f8c4ccdc6fb134c57d4a0e7c55d6031b56269e0b53b306d4d5b300bf"},"schema_version":"1.0","source":{"id":"2601.17037","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2601.17037","created_at":"2026-06-25T00:18:12Z"},{"alias_kind":"arxiv_version","alias_value":"2601.17037v2","created_at":"2026-06-25T00:18:12Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2601.17037","created_at":"2026-06-25T00:18:12Z"},{"alias_kind":"pith_short_12","alias_value":"5MKU6T5SNJBY","created_at":"2026-06-25T00:18:12Z"},{"alias_kind":"pith_short_16","alias_value":"5MKU6T5SNJBYAMSV","created_at":"2026-06-25T00:18:12Z"},{"alias_kind":"pith_short_8","alias_value":"5MKU6T5S","created_at":"2026-06-25T00:18:12Z"}],"graph_snapshots":[{"event_id":"sha256:a6688024346efa99b805573708b244f108ab077b3baf15be9d67a608d330935b","target":"graph","created_at":"2026-06-25T00:18:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2601.17037/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"We investigate visual reasoning limitations of both multimodal large language models (MLLMs) and image generation models (IGMs) by creating a novel benchmark to systematically compare failure modes across image-to-text and text-to-image tasks, enabling cross-modal evaluation of visual understanding. Despite rapid growth in machine learning, vision language models (VLMs) still fail to understand basic visual concepts such as object orientation, quantity, and spatial relationships, which highlights gaps in elementary visual reasoning. By adapting MMVP benchmark questions into explicit and implic","authors_text":"Aahana Basappa, Anish Karra, Anusri Karra, Asa Gilmore, Kevin Zhu, Pranay Goel","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-01-20T00:06:58Z","title":"AMVICC: A Novel Benchmark for Cross-Modal Failure Mode Profiling for VLMs and IGMs"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2601.17037","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f2dd66af4643dfb2869e995b906fdfe509e8e64ff966edc738512c405ea4b5b1","target":"record","created_at":"2026-06-25T00:18:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"2015ac8c379c2d03520bf8798beca82135ea225f07501588e5fd129dbf9e5023","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-01-20T00:06:58Z","title_canon_sha256":"329f9f71f8c4ccdc6fb134c57d4a0e7c55d6031b56269e0b53b306d4d5b300bf"},"schema_version":"1.0","source":{"id":"2601.17037","kind":"arxiv","version":2}},"canonical_sha256":"eb154f4fb26a43803255884065519d3e0a3b4a9e52585b4f2fc0195cbff00801","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"eb154f4fb26a43803255884065519d3e0a3b4a9e52585b4f2fc0195cbff00801","first_computed_at":"2026-06-25T00:18:12.484177Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-25T00:18:12.484177Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"syZ2m+aUEOq0wCmrlevN4kfkl2+Vbicrz+9buSfSc4tpmV+QbUrj+CFUkBbBMYdxDEbcGOYcii2+QhwoRh9aBw==","signature_status":"signed_v1","signed_at":"2026-06-25T00:18:12.484657Z","signed_message":"canonical_sha256_bytes"},"source_id":"2601.17037","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f2dd66af4643dfb2869e995b906fdfe509e8e64ff966edc738512c405ea4b5b1","sha256:a6688024346efa99b805573708b244f108ab077b3baf15be9d67a608d330935b"],"state_sha256":"ef18a2d6007b84ce9004e71823bbb72b4d91b872c70056810eaf33df81ceb9c5"}