{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2023:MTO732OKVJ32L75FQIEZXKWQIL","short_pith_number":"pith:MTO732OK","canonical_record":{"source":{"id":"2308.09351","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2023-08-18T07:17:09Z","cross_cats_sorted":["cs.AI","cs.LG","cs.MM"],"title_canon_sha256":"e1e7818069a286354947192fd46a7aa296203a81897e948b219c890eb4ecf68d","abstract_canon_sha256":"14239cadde485168ba87bddf1107eba2f21262682ee41f5f522c0d2f84ee215f"},"schema_version":"1.0"},"canonical_sha256":"64ddfde9caaa77a5ffa582099baad042fc0803e8579fb549c3fd660e8ff9c901","source":{"kind":"arxiv","id":"2308.09351","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2308.09351","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"arxiv_version","alias_value":"2308.09351v1","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2308.09351","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"pith_short_12","alias_value":"MTO732OKVJ32","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"pith_short_16","alias_value":"MTO732OKVJ32L75F","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"pith_short_8","alias_value":"MTO732OK","created_at":"2026-07-05T06:42:31Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2023:MTO732OKVJ32L75FQIEZXKWQIL","target":"record","payload":{"canonical_record":{"source":{"id":"2308.09351","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2023-08-18T07:17:09Z","cross_cats_sorted":["cs.AI","cs.LG","cs.MM"],"title_canon_sha256":"e1e7818069a286354947192fd46a7aa296203a81897e948b219c890eb4ecf68d","abstract_canon_sha256":"14239cadde485168ba87bddf1107eba2f21262682ee41f5f522c0d2f84ee215f"},"schema_version":"1.0"},"canonical_sha256":"64ddfde9caaa77a5ffa582099baad042fc0803e8579fb549c3fd660e8ff9c901","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T06:42:31.290450Z","signature_b64":"odeRtvT2kQC5A5YW1p/sb7qW1Ngrqfhmzc6JV6HHe+0iCVYz7v5CkdKWfjrQuFsVfCfDJSbtlg11ZNjIsH1mAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"64ddfde9caaa77a5ffa582099baad042fc0803e8579fb549c3fd660e8ff9c901","last_reissued_at":"2026-07-05T06:42:31.290066Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T06:42:31.290066Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2308.09351","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T06:42:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hWEQHG1U66i/ffQk997ARx1b0UyE9Q9wb5ECdlBeP3/gE1xwQwwgTUV9/Weuf6f0beCbGRFDvxgCBbRVFbc0DA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T15:43:25.849636Z"},"content_sha256":"8dfdb62b6b590710f87397e0307b12610bf4174e49ace85c34e254cd2f22c1f0","schema_version":"1.0","event_id":"sha256:8dfdb62b6b590710f87397e0307b12610bf4174e49ace85c34e254cd2f22c1f0"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2023:MTO732OKVJ32L75FQIEZXKWQIL","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"RLIPv2: Fast Scaling of Relational Language-Image Pre-training","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.LG","cs.MM"],"primary_cat":"cs.CV","authors_text":"Deli Zhao, Dong Ni, Hangjie Yuan, Jianwen Jiang, Samuel Albanie, Shiwei Zhang, Tao Feng, Xiang Wang, Yingya Zhang, Yining Pan","submitted_at":"2023-08-18T07:17:09Z","abstract_excerpt":"Relational Language-Image Pre-training (RLIP) aims to align vision representations with relational texts, thereby advancing the capability of relational reasoning in computer vision tasks. However, hindered by the slow convergence of RLIPv1 architecture and the limited availability of existing scene graph data, scaling RLIPv1 is challenging. In this paper, we propose RLIPv2, a fast converging model that enables the scaling of relational pre-training to large-scale pseudo-labelled scene graph data. To enable fast scaling, RLIPv2 introduces Asymmetric Language-Image Fusion (ALIF), a mechanism th"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2308.09351","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2308.09351/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T06:42:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yxB1rJvo6d5d4PI8nrWMRAHlJqYwmrJfU4trs3c+jqbBTIxAXKAGrs+0/TApRT+UZpL6v5C9JTCXDQ1a1ZkCBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T15:43:25.850012Z"},"content_sha256":"8a98001d37a123e8285542f6d69afee4c73f411719536345bb7bb60b8bf87438","schema_version":"1.0","event_id":"sha256:8a98001d37a123e8285542f6d69afee4c73f411719536345bb7bb60b8bf87438"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/MTO732OKVJ32L75FQIEZXKWQIL/bundle.json","state_url":"https://pith.science/pith/MTO732OKVJ32L75FQIEZXKWQIL/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/MTO732OKVJ32L75FQIEZXKWQIL/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T15:43:25Z","links":{"resolver":"https://pith.science/pith/MTO732OKVJ32L75FQIEZXKWQIL","bundle":"https://pith.science/pith/MTO732OKVJ32L75FQIEZXKWQIL/bundle.json","state":"https://pith.science/pith/MTO732OKVJ32L75FQIEZXKWQIL/state.json","well_known_bundle":"https://pith.science/.well-known/pith/MTO732OKVJ32L75FQIEZXKWQIL/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2023:MTO732OKVJ32L75FQIEZXKWQIL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"14239cadde485168ba87bddf1107eba2f21262682ee41f5f522c0d2f84ee215f","cross_cats_sorted":["cs.AI","cs.LG","cs.MM"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2023-08-18T07:17:09Z","title_canon_sha256":"e1e7818069a286354947192fd46a7aa296203a81897e948b219c890eb4ecf68d"},"schema_version":"1.0","source":{"id":"2308.09351","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2308.09351","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"arxiv_version","alias_value":"2308.09351v1","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2308.09351","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"pith_short_12","alias_value":"MTO732OKVJ32","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"pith_short_16","alias_value":"MTO732OKVJ32L75F","created_at":"2026-07-05T06:42:31Z"},{"alias_kind":"pith_short_8","alias_value":"MTO732OK","created_at":"2026-07-05T06:42:31Z"}],"graph_snapshots":[{"event_id":"sha256:8a98001d37a123e8285542f6d69afee4c73f411719536345bb7bb60b8bf87438","target":"graph","created_at":"2026-07-05T06:42:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2308.09351/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Relational Language-Image Pre-training (RLIP) aims to align vision representations with relational texts, thereby advancing the capability of relational reasoning in computer vision tasks. However, hindered by the slow convergence of RLIPv1 architecture and the limited availability of existing scene graph data, scaling RLIPv1 is challenging. In this paper, we propose RLIPv2, a fast converging model that enables the scaling of relational pre-training to large-scale pseudo-labelled scene graph data. To enable fast scaling, RLIPv2 introduces Asymmetric Language-Image Fusion (ALIF), a mechanism th","authors_text":"Deli Zhao, Dong Ni, Hangjie Yuan, Jianwen Jiang, Samuel Albanie, Shiwei Zhang, Tao Feng, Xiang Wang, Yingya Zhang, Yining Pan","cross_cats":["cs.AI","cs.LG","cs.MM"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2023-08-18T07:17:09Z","title":"RLIPv2: Fast Scaling of Relational Language-Image Pre-training"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2308.09351","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8dfdb62b6b590710f87397e0307b12610bf4174e49ace85c34e254cd2f22c1f0","target":"record","created_at":"2026-07-05T06:42:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"14239cadde485168ba87bddf1107eba2f21262682ee41f5f522c0d2f84ee215f","cross_cats_sorted":["cs.AI","cs.LG","cs.MM"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2023-08-18T07:17:09Z","title_canon_sha256":"e1e7818069a286354947192fd46a7aa296203a81897e948b219c890eb4ecf68d"},"schema_version":"1.0","source":{"id":"2308.09351","kind":"arxiv","version":1}},"canonical_sha256":"64ddfde9caaa77a5ffa582099baad042fc0803e8579fb549c3fd660e8ff9c901","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"64ddfde9caaa77a5ffa582099baad042fc0803e8579fb549c3fd660e8ff9c901","first_computed_at":"2026-07-05T06:42:31.290066Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T06:42:31.290066Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"odeRtvT2kQC5A5YW1p/sb7qW1Ngrqfhmzc6JV6HHe+0iCVYz7v5CkdKWfjrQuFsVfCfDJSbtlg11ZNjIsH1mAA==","signature_status":"signed_v1","signed_at":"2026-07-05T06:42:31.290450Z","signed_message":"canonical_sha256_bytes"},"source_id":"2308.09351","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8dfdb62b6b590710f87397e0307b12610bf4174e49ace85c34e254cd2f22c1f0","sha256:8a98001d37a123e8285542f6d69afee4c73f411719536345bb7bb60b8bf87438"],"state_sha256":"3fdeee767631f50aef7f455863cbf468331d3d7e598e90f2750d1c65b4d38b24"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"nI8PZf8owS679HXEMSPlX7Nrb8NCEoGdhP43R+wz+mqKrV1upfYChZAl1h9wcTbdLGGt7u+PlzDBkDtyCWdhBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T15:43:25.852014Z","bundle_sha256":"d6261e40f9b14288804a22e229e5ca5a51677223659b380991e3c5a65d1693a9"}}