{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:Y7A3TBXEYR6EQQJZMC3CBW5VAF","short_pith_number":"pith:Y7A3TBXE","canonical_record":{"source":{"id":"2606.11745","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T07:21:45Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"d17b3785e0137a71b2ce20f81ad6cc4253e8f493edda1d7168eb7a3450c815b2","abstract_canon_sha256":"24e97ef12307c34f520d4a4dc576d77175268db823256f4d66fce962c4ddb3d8"},"schema_version":"1.0"},"canonical_sha256":"c7c1b986e4c47c48413960b620dbb50152ae63cd9a812821f9dff6106af3893a","source":{"kind":"arxiv","id":"2606.11745","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.11745","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"arxiv_version","alias_value":"2606.11745v1","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.11745","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"pith_short_12","alias_value":"Y7A3TBXEYR6E","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"pith_short_16","alias_value":"Y7A3TBXEYR6EQQJZ","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"pith_short_8","alias_value":"Y7A3TBXE","created_at":"2026-06-11T01:10:05Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:Y7A3TBXEYR6EQQJZMC3CBW5VAF","target":"record","payload":{"canonical_record":{"source":{"id":"2606.11745","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T07:21:45Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"d17b3785e0137a71b2ce20f81ad6cc4253e8f493edda1d7168eb7a3450c815b2","abstract_canon_sha256":"24e97ef12307c34f520d4a4dc576d77175268db823256f4d66fce962c4ddb3d8"},"schema_version":"1.0"},"canonical_sha256":"c7c1b986e4c47c48413960b620dbb50152ae63cd9a812821f9dff6106af3893a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-11T01:10:05.830305Z","signature_b64":"uZ9pGCp9XPCGJ09BGr3MiXqSRUhhJ2ipe3sFIWpSpcNEYv5BnWbiO0nOYhU0ADk0dhunksrqNik4zRoIW1ENAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c7c1b986e4c47c48413960b620dbb50152ae63cd9a812821f9dff6106af3893a","last_reissued_at":"2026-06-11T01:10:05.829478Z","signature_status":"signed_v1","first_computed_at":"2026-06-11T01:10:05.829478Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.11745","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-11T01:10:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0ePwF7RpypPUSwDJuyjJ/SFIB7513kgMBqgCaZJ6zfAEAM27Jbt7ptWSFz/vfhy9HO1XHXBC9PGhG7euT4bVDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T07:56:26.843545Z"},"content_sha256":"170ed8bcbdb10c4037f78a11b62a0b7434bda1f0543164a53250fd92a31e227f","schema_version":"1.0","event_id":"sha256:170ed8bcbdb10c4037f78a11b62a0b7434bda1f0543164a53250fd92a31e227f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:Y7A3TBXEYR6EQQJZMC3CBW5VAF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"From Prompts to Tokens: Internalizing Causal Supervision in Vision-Language Model for Multi-Image Causal Reasoning","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CV","authors_text":"Haoping Yu, Jing Ma, Yuanxi Li","submitted_at":"2026-06-10T07:21:45Z","abstract_excerpt":"Visual causal reasoning is essential for understanding and intervening in the physical world, requiring identification of causal variables from visual inputs and reasoning over intervention effects. Despite recent progress, large vision--language models (VLMs) remain brittle at such tasks, especially for interventional and counterfactual queries over multi-image inputs. Most existing explorations inject causal knowledge via textual prompts, leaving causal mechanisms external to model execution and limiting reliable control during inference. To address this problem, we propose BridgeVLM, which "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.11745","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.11745/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-11T01:10:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"dxT93GFFLi41k7DgbwYXI3PCV7BE8TZ0KPgHiRUo5OomLsjhAwwPswkNb2gV7yJwLzZfVZgILNzJ8gPr6ItnCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T07:56:26.843993Z"},"content_sha256":"bffa7cbd55c390b716173cf81fa6a893d1ba6fe915f55c96d9f5308898da12bb","schema_version":"1.0","event_id":"sha256:bffa7cbd55c390b716173cf81fa6a893d1ba6fe915f55c96d9f5308898da12bb"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/Y7A3TBXEYR6EQQJZMC3CBW5VAF/bundle.json","state_url":"https://pith.science/pith/Y7A3TBXEYR6EQQJZMC3CBW5VAF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/Y7A3TBXEYR6EQQJZMC3CBW5VAF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-12T07:56:26Z","links":{"resolver":"https://pith.science/pith/Y7A3TBXEYR6EQQJZMC3CBW5VAF","bundle":"https://pith.science/pith/Y7A3TBXEYR6EQQJZMC3CBW5VAF/bundle.json","state":"https://pith.science/pith/Y7A3TBXEYR6EQQJZMC3CBW5VAF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/Y7A3TBXEYR6EQQJZMC3CBW5VAF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:Y7A3TBXEYR6EQQJZMC3CBW5VAF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"24e97ef12307c34f520d4a4dc576d77175268db823256f4d66fce962c4ddb3d8","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T07:21:45Z","title_canon_sha256":"d17b3785e0137a71b2ce20f81ad6cc4253e8f493edda1d7168eb7a3450c815b2"},"schema_version":"1.0","source":{"id":"2606.11745","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.11745","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"arxiv_version","alias_value":"2606.11745v1","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.11745","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"pith_short_12","alias_value":"Y7A3TBXEYR6E","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"pith_short_16","alias_value":"Y7A3TBXEYR6EQQJZ","created_at":"2026-06-11T01:10:05Z"},{"alias_kind":"pith_short_8","alias_value":"Y7A3TBXE","created_at":"2026-06-11T01:10:05Z"}],"graph_snapshots":[{"event_id":"sha256:bffa7cbd55c390b716173cf81fa6a893d1ba6fe915f55c96d9f5308898da12bb","target":"graph","created_at":"2026-06-11T01:10:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.11745/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Visual causal reasoning is essential for understanding and intervening in the physical world, requiring identification of causal variables from visual inputs and reasoning over intervention effects. Despite recent progress, large vision--language models (VLMs) remain brittle at such tasks, especially for interventional and counterfactual queries over multi-image inputs. Most existing explorations inject causal knowledge via textual prompts, leaving causal mechanisms external to model execution and limiting reliable control during inference. To address this problem, we propose BridgeVLM, which ","authors_text":"Haoping Yu, Jing Ma, Yuanxi Li","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T07:21:45Z","title":"From Prompts to Tokens: Internalizing Causal Supervision in Vision-Language Model for Multi-Image Causal Reasoning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.11745","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:170ed8bcbdb10c4037f78a11b62a0b7434bda1f0543164a53250fd92a31e227f","target":"record","created_at":"2026-06-11T01:10:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"24e97ef12307c34f520d4a4dc576d77175268db823256f4d66fce962c4ddb3d8","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T07:21:45Z","title_canon_sha256":"d17b3785e0137a71b2ce20f81ad6cc4253e8f493edda1d7168eb7a3450c815b2"},"schema_version":"1.0","source":{"id":"2606.11745","kind":"arxiv","version":1}},"canonical_sha256":"c7c1b986e4c47c48413960b620dbb50152ae63cd9a812821f9dff6106af3893a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c7c1b986e4c47c48413960b620dbb50152ae63cd9a812821f9dff6106af3893a","first_computed_at":"2026-06-11T01:10:05.829478Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-11T01:10:05.829478Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"uZ9pGCp9XPCGJ09BGr3MiXqSRUhhJ2ipe3sFIWpSpcNEYv5BnWbiO0nOYhU0ADk0dhunksrqNik4zRoIW1ENAg==","signature_status":"signed_v1","signed_at":"2026-06-11T01:10:05.830305Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.11745","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:170ed8bcbdb10c4037f78a11b62a0b7434bda1f0543164a53250fd92a31e227f","sha256:bffa7cbd55c390b716173cf81fa6a893d1ba6fe915f55c96d9f5308898da12bb"],"state_sha256":"9cc745040c6814469d6d505a472bf1846ab8f7e81ce4ade147479ab1bebbe765"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/Sfm6WMcTsWDzj4cRoknJy4VcLnAFnwuFb1mftHoQRqNpiF8QriLzfflLEuxxEDZz31sfQJSYGz59DrFit31BQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-12T07:56:26.846581Z","bundle_sha256":"2199abe616b87f0da70243685c096a9513df2f2b1c5db2e87ce70f2fa18bb21f"}}