{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:U4GG4VYPDRLDGSEISMMOPQUYSJ","short_pith_number":"pith:U4GG4VYP","canonical_record":{"source":{"id":"2605.22202","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T09:05:55Z","cross_cats_sorted":[],"title_canon_sha256":"8559c2bd48519ca7fefcbafaddb5fc41556e59f8a0cc27821ed3951adfa5d266","abstract_canon_sha256":"7b66197ff7a8fd2318ed66d8537eaabecc0d3a559ad3645e43c743219bf51fc1"},"schema_version":"1.0"},"canonical_sha256":"a70c6e570f1c563348889318e7c298924f05d23464acdd8f40b4c01da55bd5d9","source":{"kind":"arxiv","id":"2605.22202","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.22202","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"arxiv_version","alias_value":"2605.22202v1","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.22202","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"pith_short_12","alias_value":"U4GG4VYPDRLD","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"pith_short_16","alias_value":"U4GG4VYPDRLDGSEI","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"pith_short_8","alias_value":"U4GG4VYP","created_at":"2026-05-22T01:04:31Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:U4GG4VYPDRLDGSEISMMOPQUYSJ","target":"record","payload":{"canonical_record":{"source":{"id":"2605.22202","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T09:05:55Z","cross_cats_sorted":[],"title_canon_sha256":"8559c2bd48519ca7fefcbafaddb5fc41556e59f8a0cc27821ed3951adfa5d266","abstract_canon_sha256":"7b66197ff7a8fd2318ed66d8537eaabecc0d3a559ad3645e43c743219bf51fc1"},"schema_version":"1.0"},"canonical_sha256":"a70c6e570f1c563348889318e7c298924f05d23464acdd8f40b4c01da55bd5d9","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-22T01:04:31.977890Z","signature_b64":"2iQEEhWgHGHzt/u4P+qc9lNRJPreXA9MudCpmFpHu8WAMb+if8EfdytAErpJgs+jBuAdSG0AFjMuSUP4t7IbAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a70c6e570f1c563348889318e7c298924f05d23464acdd8f40b4c01da55bd5d9","last_reissued_at":"2026-05-22T01:04:31.977117Z","signature_status":"signed_v1","first_computed_at":"2026-05-22T01:04:31.977117Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.22202","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T01:04:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"rK2PDNDN0vfNKr/sY794p2aEOqOzBjWcCE5Be7PsmCjuW3O/tu5k2lLcKe0dvAj0I7olz/KZ6tAy5eKM083cAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T20:35:49.431417Z"},"content_sha256":"2c6b9d0193f22b60a5793f724dc52b9011e8a530b127533bd7168935c668b40e","schema_version":"1.0","event_id":"sha256:2c6b9d0193f22b60a5793f724dc52b9011e8a530b127533bd7168935c668b40e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:U4GG4VYPDRLDGSEISMMOPQUYSJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Structure Retention in Embedding Spaces as a Predictor of Benchmark Performance","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Amanda Myntti, Filip Ginter, Jenna Kanerva, Veronika Laippala","submitted_at":"2026-05-21T09:05:55Z","abstract_excerpt":"In this paper, we show that high-performing embedding models organize their embedding spaces in a consistent way. We evaluate 25 contemporary embedding models on five MTEB tasks spanning four diverse task categories (retrieval, bitext mining, pair classification, and summarization) in both English and multilingual settings, and reveal that nearest-neighbor overlap and magnitude differences in independent component analysis (ICA) between paired text instances strongly correlate (even up to 0.97) with performance on the given task. Ultimately, we show that embedding tasks display varying degrees"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.22202","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.22202/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T01:04:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P8mrmQgbLWgs6QAxp30KzArrRVz8aM+U4EaI1YjWi9XJlK1u5eaSGAHPRTdGDsNOsUP8d9e2jCe2pTnWReWtCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T20:35:49.432184Z"},"content_sha256":"3bf2ed4e9378decbe3043cb74e8f60eae1b1d577debcea663f8293824caeb189","schema_version":"1.0","event_id":"sha256:3bf2ed4e9378decbe3043cb74e8f60eae1b1d577debcea663f8293824caeb189"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/U4GG4VYPDRLDGSEISMMOPQUYSJ/bundle.json","state_url":"https://pith.science/pith/U4GG4VYPDRLDGSEISMMOPQUYSJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/U4GG4VYPDRLDGSEISMMOPQUYSJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T20:35:49Z","links":{"resolver":"https://pith.science/pith/U4GG4VYPDRLDGSEISMMOPQUYSJ","bundle":"https://pith.science/pith/U4GG4VYPDRLDGSEISMMOPQUYSJ/bundle.json","state":"https://pith.science/pith/U4GG4VYPDRLDGSEISMMOPQUYSJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/U4GG4VYPDRLDGSEISMMOPQUYSJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:U4GG4VYPDRLDGSEISMMOPQUYSJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7b66197ff7a8fd2318ed66d8537eaabecc0d3a559ad3645e43c743219bf51fc1","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T09:05:55Z","title_canon_sha256":"8559c2bd48519ca7fefcbafaddb5fc41556e59f8a0cc27821ed3951adfa5d266"},"schema_version":"1.0","source":{"id":"2605.22202","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.22202","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"arxiv_version","alias_value":"2605.22202v1","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.22202","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"pith_short_12","alias_value":"U4GG4VYPDRLD","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"pith_short_16","alias_value":"U4GG4VYPDRLDGSEI","created_at":"2026-05-22T01:04:31Z"},{"alias_kind":"pith_short_8","alias_value":"U4GG4VYP","created_at":"2026-05-22T01:04:31Z"}],"graph_snapshots":[{"event_id":"sha256:3bf2ed4e9378decbe3043cb74e8f60eae1b1d577debcea663f8293824caeb189","target":"graph","created_at":"2026-05-22T01:04:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.22202/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"In this paper, we show that high-performing embedding models organize their embedding spaces in a consistent way. We evaluate 25 contemporary embedding models on five MTEB tasks spanning four diverse task categories (retrieval, bitext mining, pair classification, and summarization) in both English and multilingual settings, and reveal that nearest-neighbor overlap and magnitude differences in independent component analysis (ICA) between paired text instances strongly correlate (even up to 0.97) with performance on the given task. Ultimately, we show that embedding tasks display varying degrees","authors_text":"Amanda Myntti, Filip Ginter, Jenna Kanerva, Veronika Laippala","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T09:05:55Z","title":"Structure Retention in Embedding Spaces as a Predictor of Benchmark Performance"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.22202","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2c6b9d0193f22b60a5793f724dc52b9011e8a530b127533bd7168935c668b40e","target":"record","created_at":"2026-05-22T01:04:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7b66197ff7a8fd2318ed66d8537eaabecc0d3a559ad3645e43c743219bf51fc1","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-21T09:05:55Z","title_canon_sha256":"8559c2bd48519ca7fefcbafaddb5fc41556e59f8a0cc27821ed3951adfa5d266"},"schema_version":"1.0","source":{"id":"2605.22202","kind":"arxiv","version":1}},"canonical_sha256":"a70c6e570f1c563348889318e7c298924f05d23464acdd8f40b4c01da55bd5d9","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a70c6e570f1c563348889318e7c298924f05d23464acdd8f40b4c01da55bd5d9","first_computed_at":"2026-05-22T01:04:31.977117Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-22T01:04:31.977117Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"2iQEEhWgHGHzt/u4P+qc9lNRJPreXA9MudCpmFpHu8WAMb+if8EfdytAErpJgs+jBuAdSG0AFjMuSUP4t7IbAw==","signature_status":"signed_v1","signed_at":"2026-05-22T01:04:31.977890Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.22202","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2c6b9d0193f22b60a5793f724dc52b9011e8a530b127533bd7168935c668b40e","sha256:3bf2ed4e9378decbe3043cb74e8f60eae1b1d577debcea663f8293824caeb189"],"state_sha256":"3022fd847a99a3a7897bd7e57564a5d8a3f1c4c951e346e9d4657ec07c400990"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"fDTW77zCmWtGLT4zws4EsxVQZHmOyiMZxYZ8ubUVKaSlvwYkIhfEK3WyFYIWg/NsfasBO5b8Mk45URajbQ+qCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T20:35:49.436084Z","bundle_sha256":"41e5c27b4e907237ec87c4f1a34d9af13161268bb0b37c4036a1914be9e511f7"}}