{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:YS4AO72QXJS654NAJABZW3TQNX","short_pith_number":"pith:YS4AO72Q","canonical_record":{"source":{"id":"2602.23353","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-02-26T18:55:06Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"fe0d8b0ec9918fb1ea40c2f823afabf96b2aeb5939e0dd8b277b55bb3cc0cdd9","abstract_canon_sha256":"a360e0eebbe18b2d153fb1dd09688a069bf854b444705d4c700b455acd5d5b03"},"schema_version":"1.0"},"canonical_sha256":"c4b8077f50ba65eef1a048039b6e706df90eb5882285b3154f35c43028a90ad8","source":{"kind":"arxiv","id":"2602.23353","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2602.23353","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"arxiv_version","alias_value":"2602.23353v2","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2602.23353","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"pith_short_12","alias_value":"YS4AO72QXJS6","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"pith_short_16","alias_value":"YS4AO72QXJS654NA","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"pith_short_8","alias_value":"YS4AO72Q","created_at":"2026-06-30T02:18:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:YS4AO72QXJS654NAJABZW3TQNX","target":"record","payload":{"canonical_record":{"source":{"id":"2602.23353","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-02-26T18:55:06Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"fe0d8b0ec9918fb1ea40c2f823afabf96b2aeb5939e0dd8b277b55bb3cc0cdd9","abstract_canon_sha256":"a360e0eebbe18b2d153fb1dd09688a069bf854b444705d4c700b455acd5d5b03"},"schema_version":"1.0"},"canonical_sha256":"c4b8077f50ba65eef1a048039b6e706df90eb5882285b3154f35c43028a90ad8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-30T02:18:07.210325Z","signature_b64":"ggl1Q5zGAzRy69xPyT6//0SghB3Ljs0rHr8DquLu8sRMAIhUShrCP90GmoWTHyLNPgZqQx/3lKGjrZu4+0oyDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c4b8077f50ba65eef1a048039b6e706df90eb5882285b3154f35c43028a90ad8","last_reissued_at":"2026-06-30T02:18:07.209767Z","signature_status":"signed_v1","first_computed_at":"2026-06-30T02:18:07.209767Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2602.23353","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T02:18:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cufYCyacZ4TclY7uh9tIzuEyCKATffkYyYL+YFWmr4UVnLL8cDJRNGCi5A69J57x29xknS+q+Y/dPnv4t/VdBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T15:38:37.402014Z"},"content_sha256":"48dd3fe130bf2b363115311f69135d2fb268a396f8a0e1716dfb61fe35e98d98","schema_version":"1.0","event_id":"sha256:48dd3fe130bf2b363115311f69135d2fb268a396f8a0e1716dfb61fe35e98d98"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:YS4AO72QXJS654NAJABZW3TQNX","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"SOTAlign: Semi-Supervised Alignment of Unimodal Vision and Language Models via Optimal Transport","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Paul Krzakala, Quentin Bouniot, Simon Roschmann, Sonia Mazelet, Zeynep Akata","submitted_at":"2026-02-26T18:55:06Z","abstract_excerpt":"The Platonic Representation Hypothesis posits that neural networks trained on different modalities converge toward a shared statistical model of the world. Recent work exploits this convergence by aligning frozen pretrained vision and language models with lightweight alignment layers, but typically relies on contrastive losses and millions of paired samples. In this work, we ask whether meaningful alignment can be achieved with substantially less supervision. We introduce a semi-supervised setting in which pretrained unimodal encoders are aligned using a small number of image-text pairs togeth"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2602.23353","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2602.23353/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T02:18:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"GBCNP1sK+nmERYysnSx2k0E6vTSwKUeLDVj4pEVqCwrI5YRQe1jeyXnjtJs6GchmEctvQlLQDEoSwK+QPj4nDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T15:38:37.402445Z"},"content_sha256":"7f97c206f46fc61059c76c0082a6705e533b20a162d42931b05a24e99286ffc3","schema_version":"1.0","event_id":"sha256:7f97c206f46fc61059c76c0082a6705e533b20a162d42931b05a24e99286ffc3"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/YS4AO72QXJS654NAJABZW3TQNX/bundle.json","state_url":"https://pith.science/pith/YS4AO72QXJS654NAJABZW3TQNX/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/YS4AO72QXJS654NAJABZW3TQNX/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-01T15:38:37Z","links":{"resolver":"https://pith.science/pith/YS4AO72QXJS654NAJABZW3TQNX","bundle":"https://pith.science/pith/YS4AO72QXJS654NAJABZW3TQNX/bundle.json","state":"https://pith.science/pith/YS4AO72QXJS654NAJABZW3TQNX/state.json","well_known_bundle":"https://pith.science/.well-known/pith/YS4AO72QXJS654NAJABZW3TQNX/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:YS4AO72QXJS654NAJABZW3TQNX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a360e0eebbe18b2d153fb1dd09688a069bf854b444705d4c700b455acd5d5b03","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-02-26T18:55:06Z","title_canon_sha256":"fe0d8b0ec9918fb1ea40c2f823afabf96b2aeb5939e0dd8b277b55bb3cc0cdd9"},"schema_version":"1.0","source":{"id":"2602.23353","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2602.23353","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"arxiv_version","alias_value":"2602.23353v2","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2602.23353","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"pith_short_12","alias_value":"YS4AO72QXJS6","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"pith_short_16","alias_value":"YS4AO72QXJS654NA","created_at":"2026-06-30T02:18:07Z"},{"alias_kind":"pith_short_8","alias_value":"YS4AO72Q","created_at":"2026-06-30T02:18:07Z"}],"graph_snapshots":[{"event_id":"sha256:7f97c206f46fc61059c76c0082a6705e533b20a162d42931b05a24e99286ffc3","target":"graph","created_at":"2026-06-30T02:18:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2602.23353/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"The Platonic Representation Hypothesis posits that neural networks trained on different modalities converge toward a shared statistical model of the world. Recent work exploits this convergence by aligning frozen pretrained vision and language models with lightweight alignment layers, but typically relies on contrastive losses and millions of paired samples. In this work, we ask whether meaningful alignment can be achieved with substantially less supervision. We introduce a semi-supervised setting in which pretrained unimodal encoders are aligned using a small number of image-text pairs togeth","authors_text":"Paul Krzakala, Quentin Bouniot, Simon Roschmann, Sonia Mazelet, Zeynep Akata","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-02-26T18:55:06Z","title":"SOTAlign: Semi-Supervised Alignment of Unimodal Vision and Language Models via Optimal Transport"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2602.23353","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:48dd3fe130bf2b363115311f69135d2fb268a396f8a0e1716dfb61fe35e98d98","target":"record","created_at":"2026-06-30T02:18:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a360e0eebbe18b2d153fb1dd09688a069bf854b444705d4c700b455acd5d5b03","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-02-26T18:55:06Z","title_canon_sha256":"fe0d8b0ec9918fb1ea40c2f823afabf96b2aeb5939e0dd8b277b55bb3cc0cdd9"},"schema_version":"1.0","source":{"id":"2602.23353","kind":"arxiv","version":2}},"canonical_sha256":"c4b8077f50ba65eef1a048039b6e706df90eb5882285b3154f35c43028a90ad8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c4b8077f50ba65eef1a048039b6e706df90eb5882285b3154f35c43028a90ad8","first_computed_at":"2026-06-30T02:18:07.209767Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-30T02:18:07.209767Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ggl1Q5zGAzRy69xPyT6//0SghB3Ljs0rHr8DquLu8sRMAIhUShrCP90GmoWTHyLNPgZqQx/3lKGjrZu4+0oyDA==","signature_status":"signed_v1","signed_at":"2026-06-30T02:18:07.210325Z","signed_message":"canonical_sha256_bytes"},"source_id":"2602.23353","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:48dd3fe130bf2b363115311f69135d2fb268a396f8a0e1716dfb61fe35e98d98","sha256:7f97c206f46fc61059c76c0082a6705e533b20a162d42931b05a24e99286ffc3"],"state_sha256":"9f4d7634da2cb639172ba2c1c53e0219c94b6cd8dd740e92434311323e8d6d54"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EHhwQZpj5hS82I8uvvmphZRvIhbVPrkCV6GTxvRpAkJ93QNTx9NPGFrC9aixSsAK/WdyHnYogBHdU3w+zA0+BA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-01T15:38:37.404596Z","bundle_sha256":"446fe8683427df0a6794ac68458ed11e525c0d770f214cf9c7899862f2d1c4c5"}}