{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:Y3FB54FRTYVHNZ2JYSFBWWZ5A2","short_pith_number":"pith:Y3FB54FR","canonical_record":{"source":{"id":"2605.29628","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2026-05-28T09:00:44Z","cross_cats_sorted":["cs.AI","cs.CL","cs.LG","eess.AS"],"title_canon_sha256":"64acf0129969e3080c4de71e0f0ada9af5eba3ff42f3cfc97a5514d05be22515","abstract_canon_sha256":"214ea80155e1efa6d67bb122b1b9139f7cba38f2f9034be83610064656d568ae"},"schema_version":"1.0"},"canonical_sha256":"c6ca1ef0b19e2a76e749c48a1b5b3d06a088a3a4a9cf3ff96fe605f9664fc5b8","source":{"kind":"arxiv","id":"2605.29628","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.29628","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"arxiv_version","alias_value":"2605.29628v1","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.29628","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"pith_short_12","alias_value":"Y3FB54FRTYVH","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"pith_short_16","alias_value":"Y3FB54FRTYVHNZ2J","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"pith_short_8","alias_value":"Y3FB54FR","created_at":"2026-05-29T01:05:51Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:Y3FB54FRTYVHNZ2JYSFBWWZ5A2","target":"record","payload":{"canonical_record":{"source":{"id":"2605.29628","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2026-05-28T09:00:44Z","cross_cats_sorted":["cs.AI","cs.CL","cs.LG","eess.AS"],"title_canon_sha256":"64acf0129969e3080c4de71e0f0ada9af5eba3ff42f3cfc97a5514d05be22515","abstract_canon_sha256":"214ea80155e1efa6d67bb122b1b9139f7cba38f2f9034be83610064656d568ae"},"schema_version":"1.0"},"canonical_sha256":"c6ca1ef0b19e2a76e749c48a1b5b3d06a088a3a4a9cf3ff96fe605f9664fc5b8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T01:05:51.802787Z","signature_b64":"Lavf4E1y3z6/rmixIEooGlm+nRXOujSXZuh37fUKKTYrTqoUp3j/JxA4zeX1oKAHqvFQlaSkxmG1ZmR5ia15AQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c6ca1ef0b19e2a76e749c48a1b5b3d06a088a3a4a9cf3ff96fe605f9664fc5b8","last_reissued_at":"2026-05-29T01:05:51.802159Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T01:05:51.802159Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.29628","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"W0Y+SnO+u5ZTQXOc4SBEHGnmE3HzjugICUiKt9iab1V8qJuex3NlzIXa8wZjP4CURl/xbZzRo7LuPrJfhnRkDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T17:21:30.763657Z"},"content_sha256":"a7f6f74d139538b2303eb6003d28eec61746247b50ccb77b7165afaa2beb1cd7","schema_version":"1.0","event_id":"sha256:a7f6f74d139538b2303eb6003d28eec61746247b50ccb77b7165afaa2beb1cd7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:Y3FB54FRTYVHNZ2JYSFBWWZ5A2","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"COMET: Concept Space Dissection of the Modality Gap in Audio-Text Multimodal Contrastive Embeddings","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.LG","eess.AS"],"primary_cat":"cs.SD","authors_text":"Aidong Men, Liting Gao, Wenwu Wang, Yonggang Zhu","submitted_at":"2026-05-28T09:00:44Z","abstract_excerpt":"Contrastive Language-Audio Pretraining (CLAP) models are widely used for audio understanding and support modality-agnostic condition swapping in many zero-shot applications. However, their performance is heavily affected by the modality gap between audio and text embeddings. Existing explanations mainly attribute this gap to the cone effect, treating it as a shift between mean embeddings, yet correcting the mean alone yields only limited improvements. Alternative hypotheses, such as information imbalance and dimensionality collapse, have also been proposed, but they remain insufficiently verif"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.29628","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.29628/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"aA+BLT8OJmwTCGjGJT18uA1PirmGourh/mk9TVkMljHzJvkQvjFRTjYKrSq5WgGjL64UmY6vZWoWKirk4WmnDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T17:21:30.764034Z"},"content_sha256":"6d5e9b9b6fb309fd54766d88a0d5dc83b01e8f9833217a2975684ab0d844ef5a","schema_version":"1.0","event_id":"sha256:6d5e9b9b6fb309fd54766d88a0d5dc83b01e8f9833217a2975684ab0d844ef5a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/Y3FB54FRTYVHNZ2JYSFBWWZ5A2/bundle.json","state_url":"https://pith.science/pith/Y3FB54FRTYVHNZ2JYSFBWWZ5A2/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/Y3FB54FRTYVHNZ2JYSFBWWZ5A2/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T17:21:30Z","links":{"resolver":"https://pith.science/pith/Y3FB54FRTYVHNZ2JYSFBWWZ5A2","bundle":"https://pith.science/pith/Y3FB54FRTYVHNZ2JYSFBWWZ5A2/bundle.json","state":"https://pith.science/pith/Y3FB54FRTYVHNZ2JYSFBWWZ5A2/state.json","well_known_bundle":"https://pith.science/.well-known/pith/Y3FB54FRTYVHNZ2JYSFBWWZ5A2/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:Y3FB54FRTYVHNZ2JYSFBWWZ5A2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"214ea80155e1efa6d67bb122b1b9139f7cba38f2f9034be83610064656d568ae","cross_cats_sorted":["cs.AI","cs.CL","cs.LG","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2026-05-28T09:00:44Z","title_canon_sha256":"64acf0129969e3080c4de71e0f0ada9af5eba3ff42f3cfc97a5514d05be22515"},"schema_version":"1.0","source":{"id":"2605.29628","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.29628","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"arxiv_version","alias_value":"2605.29628v1","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.29628","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"pith_short_12","alias_value":"Y3FB54FRTYVH","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"pith_short_16","alias_value":"Y3FB54FRTYVHNZ2J","created_at":"2026-05-29T01:05:51Z"},{"alias_kind":"pith_short_8","alias_value":"Y3FB54FR","created_at":"2026-05-29T01:05:51Z"}],"graph_snapshots":[{"event_id":"sha256:6d5e9b9b6fb309fd54766d88a0d5dc83b01e8f9833217a2975684ab0d844ef5a","target":"graph","created_at":"2026-05-29T01:05:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.29628/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Contrastive Language-Audio Pretraining (CLAP) models are widely used for audio understanding and support modality-agnostic condition swapping in many zero-shot applications. However, their performance is heavily affected by the modality gap between audio and text embeddings. Existing explanations mainly attribute this gap to the cone effect, treating it as a shift between mean embeddings, yet correcting the mean alone yields only limited improvements. Alternative hypotheses, such as information imbalance and dimensionality collapse, have also been proposed, but they remain insufficiently verif","authors_text":"Aidong Men, Liting Gao, Wenwu Wang, Yonggang Zhu","cross_cats":["cs.AI","cs.CL","cs.LG","eess.AS"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2026-05-28T09:00:44Z","title":"COMET: Concept Space Dissection of the Modality Gap in Audio-Text Multimodal Contrastive Embeddings"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.29628","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a7f6f74d139538b2303eb6003d28eec61746247b50ccb77b7165afaa2beb1cd7","target":"record","created_at":"2026-05-29T01:05:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"214ea80155e1efa6d67bb122b1b9139f7cba38f2f9034be83610064656d568ae","cross_cats_sorted":["cs.AI","cs.CL","cs.LG","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2026-05-28T09:00:44Z","title_canon_sha256":"64acf0129969e3080c4de71e0f0ada9af5eba3ff42f3cfc97a5514d05be22515"},"schema_version":"1.0","source":{"id":"2605.29628","kind":"arxiv","version":1}},"canonical_sha256":"c6ca1ef0b19e2a76e749c48a1b5b3d06a088a3a4a9cf3ff96fe605f9664fc5b8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c6ca1ef0b19e2a76e749c48a1b5b3d06a088a3a4a9cf3ff96fe605f9664fc5b8","first_computed_at":"2026-05-29T01:05:51.802159Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T01:05:51.802159Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Lavf4E1y3z6/rmixIEooGlm+nRXOujSXZuh37fUKKTYrTqoUp3j/JxA4zeX1oKAHqvFQlaSkxmG1ZmR5ia15AQ==","signature_status":"signed_v1","signed_at":"2026-05-29T01:05:51.802787Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.29628","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a7f6f74d139538b2303eb6003d28eec61746247b50ccb77b7165afaa2beb1cd7","sha256:6d5e9b9b6fb309fd54766d88a0d5dc83b01e8f9833217a2975684ab0d844ef5a"],"state_sha256":"7a3507bc130a0ebabba79a5988b55fb758e0d9d65a32970a9f3b36026c68c347"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EyH8oNnESPpxU0jjDYVj2RbqUQJ33udBDAERTHV7u3CDxrtAztesD24x9jZ7dtfhk5AHycIVZe71p9PToDfUCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T17:21:30.766090Z","bundle_sha256":"f6c43e0a66011e226f90f2f24097b1bdc091c0895b502db4373c1530b76d0a3c"}}