{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:I4XVZUWP7XFG42JEFHPZLHS5HI","short_pith_number":"pith:I4XVZUWP","canonical_record":{"source":{"id":"2510.22276","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-25T12:42:42Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"ca0fb48143a01a9a3fb11997f542fecc0374f61558acc529ebc5c0d609701a68","abstract_canon_sha256":"d72f4ef96a3628e802a0b88e8028e270fe859a5a714de83f51db7b6c2d6cd37e"},"schema_version":"1.0"},"canonical_sha256":"472f5cd2cffdca6e692429df959e5d3a27c1d7c50be24d09573b4c830dabe399","source":{"kind":"arxiv","id":"2510.22276","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2510.22276","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"arxiv_version","alias_value":"2510.22276v3","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.22276","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"pith_short_12","alias_value":"I4XVZUWP7XFG","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"pith_short_16","alias_value":"I4XVZUWP7XFG42JE","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"pith_short_8","alias_value":"I4XVZUWP","created_at":"2026-06-02T02:04:10Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:I4XVZUWP7XFG42JEFHPZLHS5HI","target":"record","payload":{"canonical_record":{"source":{"id":"2510.22276","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-25T12:42:42Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"ca0fb48143a01a9a3fb11997f542fecc0374f61558acc529ebc5c0d609701a68","abstract_canon_sha256":"d72f4ef96a3628e802a0b88e8028e270fe859a5a714de83f51db7b6c2d6cd37e"},"schema_version":"1.0"},"canonical_sha256":"472f5cd2cffdca6e692429df959e5d3a27c1d7c50be24d09573b4c830dabe399","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T02:04:10.339104Z","signature_b64":"nOVP3JFN0Qg7GGRMf1ctMMe4kUsxNw2UR6fj1rYld3F1wRNrXdqXdp+lXNvLvAhDyvvd9ltBvHcySGNZqYAhAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"472f5cd2cffdca6e692429df959e5d3a27c1d7c50be24d09573b4c830dabe399","last_reissued_at":"2026-06-02T02:04:10.338641Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T02:04:10.338641Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2510.22276","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T02:04:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"v+yY8EkhPfx/U6VbXrJgVMHWiSCZfzW7QNZyyBbvA9Uz+PZYrBvqA0pfTI4YNC2p64YMTFa4fUhOaj8bMuVkBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T14:52:32.978752Z"},"content_sha256":"466eea8687f6b437c17f8f3a0ff5239daefd73ace80a5a22e719dcb9de59fe68","schema_version":"1.0","event_id":"sha256:466eea8687f6b437c17f8f3a0ff5239daefd73ace80a5a22e719dcb9de59fe68"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:I4XVZUWP7XFG42JEFHPZLHS5HI","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"WAON: A Large-Scale Japanese Image-Text Dataset for Cultural Adaptation in Contrastive Vision-Language Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"cs.CV","authors_text":"Daisuke Kawahara, Issa Sugiura, Naoaki Okazaki, Shuhei Kurita, Yasuo Okabe, Yusuke Oda","submitted_at":"2025-10-25T12:42:42Z","abstract_excerpt":"Contrastive vision-language models have achieved remarkable progress through large-scale pretraining. Recent work has shown that removing English-only caption filters and pretraining on global data is effective for improving multicultural performance. We study whether such global pretraining is sufficient for culture-specific understanding, or whether further adaptation with natively sourced data can boost performance beyond what global pretraining alone achieves. To enable this investigation, we present WAON, the largest publicly available native Japanese image-text dataset constructed from n"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.22276","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2510.22276/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T02:04:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZDSaeC67jYp8QbIYqGBBg91fgrN9PlUDPccoz6LYH1tsM8GUkqcXkDZZwu84VDJvjZQqpMQc8/2XrSAX/ozSAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T14:52:32.979488Z"},"content_sha256":"b559aa86e9f82c7ec2e39005ad46d4bb0a7d060b785b3de6dbb766eff5f5308d","schema_version":"1.0","event_id":"sha256:b559aa86e9f82c7ec2e39005ad46d4bb0a7d060b785b3de6dbb766eff5f5308d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/I4XVZUWP7XFG42JEFHPZLHS5HI/bundle.json","state_url":"https://pith.science/pith/I4XVZUWP7XFG42JEFHPZLHS5HI/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/I4XVZUWP7XFG42JEFHPZLHS5HI/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T14:52:32Z","links":{"resolver":"https://pith.science/pith/I4XVZUWP7XFG42JEFHPZLHS5HI","bundle":"https://pith.science/pith/I4XVZUWP7XFG42JEFHPZLHS5HI/bundle.json","state":"https://pith.science/pith/I4XVZUWP7XFG42JEFHPZLHS5HI/state.json","well_known_bundle":"https://pith.science/.well-known/pith/I4XVZUWP7XFG42JEFHPZLHS5HI/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:I4XVZUWP7XFG42JEFHPZLHS5HI","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d72f4ef96a3628e802a0b88e8028e270fe859a5a714de83f51db7b6c2d6cd37e","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-25T12:42:42Z","title_canon_sha256":"ca0fb48143a01a9a3fb11997f542fecc0374f61558acc529ebc5c0d609701a68"},"schema_version":"1.0","source":{"id":"2510.22276","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2510.22276","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"arxiv_version","alias_value":"2510.22276v3","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.22276","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"pith_short_12","alias_value":"I4XVZUWP7XFG","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"pith_short_16","alias_value":"I4XVZUWP7XFG42JE","created_at":"2026-06-02T02:04:10Z"},{"alias_kind":"pith_short_8","alias_value":"I4XVZUWP","created_at":"2026-06-02T02:04:10Z"}],"graph_snapshots":[{"event_id":"sha256:b559aa86e9f82c7ec2e39005ad46d4bb0a7d060b785b3de6dbb766eff5f5308d","target":"graph","created_at":"2026-06-02T02:04:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2510.22276/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Contrastive vision-language models have achieved remarkable progress through large-scale pretraining. Recent work has shown that removing English-only caption filters and pretraining on global data is effective for improving multicultural performance. We study whether such global pretraining is sufficient for culture-specific understanding, or whether further adaptation with natively sourced data can boost performance beyond what global pretraining alone achieves. To enable this investigation, we present WAON, the largest publicly available native Japanese image-text dataset constructed from n","authors_text":"Daisuke Kawahara, Issa Sugiura, Naoaki Okazaki, Shuhei Kurita, Yasuo Okabe, Yusuke Oda","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-25T12:42:42Z","title":"WAON: A Large-Scale Japanese Image-Text Dataset for Cultural Adaptation in Contrastive Vision-Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.22276","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:466eea8687f6b437c17f8f3a0ff5239daefd73ace80a5a22e719dcb9de59fe68","target":"record","created_at":"2026-06-02T02:04:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d72f4ef96a3628e802a0b88e8028e270fe859a5a714de83f51db7b6c2d6cd37e","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-25T12:42:42Z","title_canon_sha256":"ca0fb48143a01a9a3fb11997f542fecc0374f61558acc529ebc5c0d609701a68"},"schema_version":"1.0","source":{"id":"2510.22276","kind":"arxiv","version":3}},"canonical_sha256":"472f5cd2cffdca6e692429df959e5d3a27c1d7c50be24d09573b4c830dabe399","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"472f5cd2cffdca6e692429df959e5d3a27c1d7c50be24d09573b4c830dabe399","first_computed_at":"2026-06-02T02:04:10.338641Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T02:04:10.338641Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"nOVP3JFN0Qg7GGRMf1ctMMe4kUsxNw2UR6fj1rYld3F1wRNrXdqXdp+lXNvLvAhDyvvd9ltBvHcySGNZqYAhAg==","signature_status":"signed_v1","signed_at":"2026-06-02T02:04:10.339104Z","signed_message":"canonical_sha256_bytes"},"source_id":"2510.22276","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:466eea8687f6b437c17f8f3a0ff5239daefd73ace80a5a22e719dcb9de59fe68","sha256:b559aa86e9f82c7ec2e39005ad46d4bb0a7d060b785b3de6dbb766eff5f5308d"],"state_sha256":"14da2cab1410339d9e3630205cd84deee00ca3e78192dccd0a451c0df4eb643f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"fL9zluKvsaiyS5QazlL3UN8lViLeGxBUJaINxxE+DTsnezYK+FQNmuhz0vTE5iGZ+1XVIZz+wwEOffeC5WSGDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T14:52:32.983519Z","bundle_sha256":"15dbdb5f14edd027b6d7b2929fe38c8a8a8ab9b378b7d78e990e9ab0f32eb373"}}