{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:ZAGTGH5XUOO7KSFHXJVMG3VOBC","short_pith_number":"pith:ZAGTGH5X","canonical_record":{"source":{"id":"2504.04065","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2025-04-05T05:42:12Z","cross_cats_sorted":["cs.IR","cs.MM"],"title_canon_sha256":"2069b758c10fcdea997a8f1586c9467d4a553502e67c07117ba3cc4ed6bf9b92","abstract_canon_sha256":"a33392b959a01a484fc40566a4ae8ebde746d73473039127d2e4698f2b1c78a4"},"schema_version":"1.0"},"canonical_sha256":"c80d331fb7a39df548a7ba6ac36eae08876b3955f36170e5dfbb34f3ae782b23","source":{"kind":"arxiv","id":"2504.04065","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2504.04065","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"arxiv_version","alias_value":"2504.04065v2","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2504.04065","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"pith_short_12","alias_value":"ZAGTGH5XUOO7","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"pith_short_16","alias_value":"ZAGTGH5XUOO7KSFH","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"pith_short_8","alias_value":"ZAGTGH5X","created_at":"2026-05-20T01:04:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:ZAGTGH5XUOO7KSFHXJVMG3VOBC","target":"record","payload":{"canonical_record":{"source":{"id":"2504.04065","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2025-04-05T05:42:12Z","cross_cats_sorted":["cs.IR","cs.MM"],"title_canon_sha256":"2069b758c10fcdea997a8f1586c9467d4a553502e67c07117ba3cc4ed6bf9b92","abstract_canon_sha256":"a33392b959a01a484fc40566a4ae8ebde746d73473039127d2e4698f2b1c78a4"},"schema_version":"1.0"},"canonical_sha256":"c80d331fb7a39df548a7ba6ac36eae08876b3955f36170e5dfbb34f3ae782b23","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:04:53.525528Z","signature_b64":"SGTozVjHHAcqVZbGKb0j2eqfal1zT//QLVSEyXIrba8GHVgG5svI6hN2rT5U5GgkUIN1ZwCSFoQafSZs6SSRBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c80d331fb7a39df548a7ba6ac36eae08876b3955f36170e5dfbb34f3ae782b23","last_reissued_at":"2026-05-20T01:04:53.524679Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:04:53.524679Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2504.04065","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:04:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"rQMx455wY9sEUVNaVEgYSrqD/hwYW0pYBJZZcOUY3zYXDKHCnVBenk2bzFLNcQcaE5620p6zSpDNhN06KU62CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T23:14:48.308545Z"},"content_sha256":"3e28be854d5795a016e6878c93bd056d76c614983097887f733049ca079bee96","schema_version":"1.0","event_id":"sha256:3e28be854d5795a016e6878c93bd056d76c614983097887f733049ca079bee96"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:ZAGTGH5XUOO7KSFHXJVMG3VOBC","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Enabling Collaborative Parametric Knowledge Calibration for Retrieval-Augmented Vision Question Answering","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.IR","cs.MM"],"primary_cat":"cs.CV","authors_text":"Dingxian Wang, Guandong Xu, Huan Huo, Jiaqi Deng, Kaize Shi, Zonghan Wu","submitted_at":"2025-04-05T05:42:12Z","abstract_excerpt":"Knowledge-based Vision Question Answering (KB-VQA) systems address complex visual-grounded questions with knowledge retrieved from external knowledge bases. The tasks of knowledge retrieval and answer generation tasks both necessitate precise multimodal understanding of question context and external knowledge. However, existing methods treat these two stages as separate modules with limited interaction during training, which hinders bi-directional parametric knowledge sharing, ultimately leading to suboptimal performance. To fully exploit the cross-task synergy in KB-VQA, we propose a unified "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2504.04065","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2504.04065/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:04:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VkBe+3Kq2IoRIK7/00mBe1YC160M1hxU6UFICSLD3tCpohIHmoCYFl7Y3PXT+t/Kr/kMTR+yLk+a0bRbbdhKCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T23:14:48.309281Z"},"content_sha256":"1a5fd471418c4e6eb9b2b9cde022792c449f6d1794a66e120fea0e64d26e1a01","schema_version":"1.0","event_id":"sha256:1a5fd471418c4e6eb9b2b9cde022792c449f6d1794a66e120fea0e64d26e1a01"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZAGTGH5XUOO7KSFHXJVMG3VOBC/bundle.json","state_url":"https://pith.science/pith/ZAGTGH5XUOO7KSFHXJVMG3VOBC/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZAGTGH5XUOO7KSFHXJVMG3VOBC/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T23:14:48Z","links":{"resolver":"https://pith.science/pith/ZAGTGH5XUOO7KSFHXJVMG3VOBC","bundle":"https://pith.science/pith/ZAGTGH5XUOO7KSFHXJVMG3VOBC/bundle.json","state":"https://pith.science/pith/ZAGTGH5XUOO7KSFHXJVMG3VOBC/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZAGTGH5XUOO7KSFHXJVMG3VOBC/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:ZAGTGH5XUOO7KSFHXJVMG3VOBC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a33392b959a01a484fc40566a4ae8ebde746d73473039127d2e4698f2b1c78a4","cross_cats_sorted":["cs.IR","cs.MM"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2025-04-05T05:42:12Z","title_canon_sha256":"2069b758c10fcdea997a8f1586c9467d4a553502e67c07117ba3cc4ed6bf9b92"},"schema_version":"1.0","source":{"id":"2504.04065","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2504.04065","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"arxiv_version","alias_value":"2504.04065v2","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2504.04065","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"pith_short_12","alias_value":"ZAGTGH5XUOO7","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"pith_short_16","alias_value":"ZAGTGH5XUOO7KSFH","created_at":"2026-05-20T01:04:53Z"},{"alias_kind":"pith_short_8","alias_value":"ZAGTGH5X","created_at":"2026-05-20T01:04:53Z"}],"graph_snapshots":[{"event_id":"sha256:1a5fd471418c4e6eb9b2b9cde022792c449f6d1794a66e120fea0e64d26e1a01","target":"graph","created_at":"2026-05-20T01:04:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2504.04065/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Knowledge-based Vision Question Answering (KB-VQA) systems address complex visual-grounded questions with knowledge retrieved from external knowledge bases. The tasks of knowledge retrieval and answer generation tasks both necessitate precise multimodal understanding of question context and external knowledge. However, existing methods treat these two stages as separate modules with limited interaction during training, which hinders bi-directional parametric knowledge sharing, ultimately leading to suboptimal performance. To fully exploit the cross-task synergy in KB-VQA, we propose a unified ","authors_text":"Dingxian Wang, Guandong Xu, Huan Huo, Jiaqi Deng, Kaize Shi, Zonghan Wu","cross_cats":["cs.IR","cs.MM"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2025-04-05T05:42:12Z","title":"Enabling Collaborative Parametric Knowledge Calibration for Retrieval-Augmented Vision Question Answering"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2504.04065","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3e28be854d5795a016e6878c93bd056d76c614983097887f733049ca079bee96","target":"record","created_at":"2026-05-20T01:04:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a33392b959a01a484fc40566a4ae8ebde746d73473039127d2e4698f2b1c78a4","cross_cats_sorted":["cs.IR","cs.MM"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2025-04-05T05:42:12Z","title_canon_sha256":"2069b758c10fcdea997a8f1586c9467d4a553502e67c07117ba3cc4ed6bf9b92"},"schema_version":"1.0","source":{"id":"2504.04065","kind":"arxiv","version":2}},"canonical_sha256":"c80d331fb7a39df548a7ba6ac36eae08876b3955f36170e5dfbb34f3ae782b23","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c80d331fb7a39df548a7ba6ac36eae08876b3955f36170e5dfbb34f3ae782b23","first_computed_at":"2026-05-20T01:04:53.524679Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T01:04:53.524679Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"SGTozVjHHAcqVZbGKb0j2eqfal1zT//QLVSEyXIrba8GHVgG5svI6hN2rT5U5GgkUIN1ZwCSFoQafSZs6SSRBQ==","signature_status":"signed_v1","signed_at":"2026-05-20T01:04:53.525528Z","signed_message":"canonical_sha256_bytes"},"source_id":"2504.04065","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3e28be854d5795a016e6878c93bd056d76c614983097887f733049ca079bee96","sha256:1a5fd471418c4e6eb9b2b9cde022792c449f6d1794a66e120fea0e64d26e1a01"],"state_sha256":"1b88dc45273cbbbad24189bcc55f88bca4b52943fdaa9e43d54d45572f7eab07"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"f8afxCrYv09JAZ9dHxoXKs2vQX0srZqBIHi4AW4STNPs8fnA1cyRO83h/40vV5Z0M6hIqyz9lkyClzXIJRjpDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T23:14:48.313076Z","bundle_sha256":"99143775413d9beed844b08d88e461d72533180b3f265f90f9ff08a8a90abb03"}}