{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:CAO5SB4A73NPVNJXGXTAYRVRMO","short_pith_number":"pith:CAO5SB4A","canonical_record":{"source":{"id":"2606.12303","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T16:40:18Z","cross_cats_sorted":[],"title_canon_sha256":"20de4f71f86b159861131333ddc70bad042b7058d28b71646ada90c50b0b5f8d","abstract_canon_sha256":"d08c6323b7ddf47080185359c6d12b742776b8edc10e57cfda67db8e6993cc3a"},"schema_version":"1.0"},"canonical_sha256":"101dd90780fedafab53735e60c46b163a35d6b99c1f479bcde41147d998842b7","source":{"kind":"arxiv","id":"2606.12303","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.12303","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"arxiv_version","alias_value":"2606.12303v1","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.12303","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"pith_short_12","alias_value":"CAO5SB4A73NP","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"pith_short_16","alias_value":"CAO5SB4A73NPVNJX","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"pith_short_8","alias_value":"CAO5SB4A","created_at":"2026-06-11T01:11:00Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:CAO5SB4A73NPVNJXGXTAYRVRMO","target":"record","payload":{"canonical_record":{"source":{"id":"2606.12303","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T16:40:18Z","cross_cats_sorted":[],"title_canon_sha256":"20de4f71f86b159861131333ddc70bad042b7058d28b71646ada90c50b0b5f8d","abstract_canon_sha256":"d08c6323b7ddf47080185359c6d12b742776b8edc10e57cfda67db8e6993cc3a"},"schema_version":"1.0"},"canonical_sha256":"101dd90780fedafab53735e60c46b163a35d6b99c1f479bcde41147d998842b7","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-11T01:11:00.853935Z","signature_b64":"NqCAUtJS4GEkXvwgYyV05dhB0EkQLAbOZu9c+LA0M/EckYBrc3STGszqn0Z7RM7A83QAzKyQJpFJMcnbq19IBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"101dd90780fedafab53735e60c46b163a35d6b99c1f479bcde41147d998842b7","last_reissued_at":"2026-06-11T01:11:00.853222Z","signature_status":"signed_v1","first_computed_at":"2026-06-11T01:11:00.853222Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.12303","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-11T01:11:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yEjcx+PFg4OJGvAviZL48eHnbvLtdCttDgPOoGkPy9GzrPctYHhqcm+Ok1SQGCGgruc8kca4wVxY9d1e00ytBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-26T20:12:35.692955Z"},"content_sha256":"be6b8500a6fbf24f23d6e313f7afdc876e497c04d5edac1493666e770bf9a221","schema_version":"1.0","event_id":"sha256:be6b8500a6fbf24f23d6e313f7afdc876e497c04d5edac1493666e770bf9a221"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:CAO5SB4A73NPVNJXGXTAYRVRMO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"From 2D Grids to 1D Tokens: Reforming Shared Representations for Multimodal Image Fusion","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Yang He, Yi Yang, Yuchen Xian, Yunqiu Xu","submitted_at":"2026-06-10T16:40:18Z","abstract_excerpt":"Multimodal image fusion aims to integrate complementary information from different modalities into a fused image that preserves rich local details while maintaining globally consistent appearance. Existing approaches build shared representations on 2D feature grids, which excel at modeling local structures but offer limited leverage over image-level global appearance factors. To balance these objectives, we introduce a compact 1D token interface based on a frozen pretrained image tokenizer for modeling non-local appearance/base factors. Rather than using the tokenizer as a reconstruction backb"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.12303","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.12303/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-11T01:11:00Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"I6c6hDtNktLdr+0aHoX/ej/J9kT9XF+UJPq2o5UR9qUgIhq4XiPIQlR+fJZL0ezmUt04Zg9gQ4bPObMLfSTjAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-26T20:12:35.693338Z"},"content_sha256":"f6b27db9b603508ddca061d5223f66ab198a5dbf924f0726bcfed761f7775b75","schema_version":"1.0","event_id":"sha256:f6b27db9b603508ddca061d5223f66ab198a5dbf924f0726bcfed761f7775b75"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CAO5SB4A73NPVNJXGXTAYRVRMO/bundle.json","state_url":"https://pith.science/pith/CAO5SB4A73NPVNJXGXTAYRVRMO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CAO5SB4A73NPVNJXGXTAYRVRMO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-26T20:12:35Z","links":{"resolver":"https://pith.science/pith/CAO5SB4A73NPVNJXGXTAYRVRMO","bundle":"https://pith.science/pith/CAO5SB4A73NPVNJXGXTAYRVRMO/bundle.json","state":"https://pith.science/pith/CAO5SB4A73NPVNJXGXTAYRVRMO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CAO5SB4A73NPVNJXGXTAYRVRMO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:CAO5SB4A73NPVNJXGXTAYRVRMO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d08c6323b7ddf47080185359c6d12b742776b8edc10e57cfda67db8e6993cc3a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T16:40:18Z","title_canon_sha256":"20de4f71f86b159861131333ddc70bad042b7058d28b71646ada90c50b0b5f8d"},"schema_version":"1.0","source":{"id":"2606.12303","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.12303","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"arxiv_version","alias_value":"2606.12303v1","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.12303","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"pith_short_12","alias_value":"CAO5SB4A73NP","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"pith_short_16","alias_value":"CAO5SB4A73NPVNJX","created_at":"2026-06-11T01:11:00Z"},{"alias_kind":"pith_short_8","alias_value":"CAO5SB4A","created_at":"2026-06-11T01:11:00Z"}],"graph_snapshots":[{"event_id":"sha256:f6b27db9b603508ddca061d5223f66ab198a5dbf924f0726bcfed761f7775b75","target":"graph","created_at":"2026-06-11T01:11:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.12303/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Multimodal image fusion aims to integrate complementary information from different modalities into a fused image that preserves rich local details while maintaining globally consistent appearance. Existing approaches build shared representations on 2D feature grids, which excel at modeling local structures but offer limited leverage over image-level global appearance factors. To balance these objectives, we introduce a compact 1D token interface based on a frozen pretrained image tokenizer for modeling non-local appearance/base factors. Rather than using the tokenizer as a reconstruction backb","authors_text":"Yang He, Yi Yang, Yuchen Xian, Yunqiu Xu","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T16:40:18Z","title":"From 2D Grids to 1D Tokens: Reforming Shared Representations for Multimodal Image Fusion"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.12303","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:be6b8500a6fbf24f23d6e313f7afdc876e497c04d5edac1493666e770bf9a221","target":"record","created_at":"2026-06-11T01:11:00Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d08c6323b7ddf47080185359c6d12b742776b8edc10e57cfda67db8e6993cc3a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T16:40:18Z","title_canon_sha256":"20de4f71f86b159861131333ddc70bad042b7058d28b71646ada90c50b0b5f8d"},"schema_version":"1.0","source":{"id":"2606.12303","kind":"arxiv","version":1}},"canonical_sha256":"101dd90780fedafab53735e60c46b163a35d6b99c1f479bcde41147d998842b7","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"101dd90780fedafab53735e60c46b163a35d6b99c1f479bcde41147d998842b7","first_computed_at":"2026-06-11T01:11:00.853222Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-11T01:11:00.853222Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"NqCAUtJS4GEkXvwgYyV05dhB0EkQLAbOZu9c+LA0M/EckYBrc3STGszqn0Z7RM7A83QAzKyQJpFJMcnbq19IBw==","signature_status":"signed_v1","signed_at":"2026-06-11T01:11:00.853935Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.12303","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:be6b8500a6fbf24f23d6e313f7afdc876e497c04d5edac1493666e770bf9a221","sha256:f6b27db9b603508ddca061d5223f66ab198a5dbf924f0726bcfed761f7775b75"],"state_sha256":"7f67df6a37bc4677d111c586689277e0042cacfe875ba8a5f6f0755a77ec0541"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"XtZ/kIH6drsuyQNXZhZ+lN1A5g+pjN4yV3rLsgqg0DWhmnJeqjszLYKKZuDlJyRVNR+sVxOrrxhew1SZFrmABg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-26T20:12:35.695279Z","bundle_sha256":"fa9a5d1b61834923365e8997d6e787f42fd9afa9360b594996df22c0597c509a"}}