{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:URTZ6GV2WY2JL4N5IZ5KSIFOBG","short_pith_number":"pith:URTZ6GV2","canonical_record":{"source":{"id":"2510.16416","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-18T09:22:40Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"dc4a5f9a2c4244bbfc8a2d4f13edbd3a2859d918b730aa5d900a6c0d2994b153","abstract_canon_sha256":"4eda7f472ee1c0deba60cd9e9c02f998a989a7d8aa3519a97067320ebe99f022"},"schema_version":"1.0"},"canonical_sha256":"a4679f1abab63495f1bd467aa920ae09b14683f5da72892856cfc01138dbc296","source":{"kind":"arxiv","id":"2510.16416","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2510.16416","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"arxiv_version","alias_value":"2510.16416v4","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.16416","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"pith_short_12","alias_value":"URTZ6GV2WY2J","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"pith_short_16","alias_value":"URTZ6GV2WY2JL4N5","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"pith_short_8","alias_value":"URTZ6GV2","created_at":"2026-05-20T00:02:57Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:URTZ6GV2WY2JL4N5IZ5KSIFOBG","target":"record","payload":{"canonical_record":{"source":{"id":"2510.16416","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-18T09:22:40Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"dc4a5f9a2c4244bbfc8a2d4f13edbd3a2859d918b730aa5d900a6c0d2994b153","abstract_canon_sha256":"4eda7f472ee1c0deba60cd9e9c02f998a989a7d8aa3519a97067320ebe99f022"},"schema_version":"1.0"},"canonical_sha256":"a4679f1abab63495f1bd467aa920ae09b14683f5da72892856cfc01138dbc296","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:02:57.586549Z","signature_b64":"W8C0h3IhBTSWmkosnucV6M4uLof2ZkBN41dId3DpUE/8s0dQGhCh1FAD+NwlNQCsR3zn/zTE/Q5EKUmNCpUoCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a4679f1abab63495f1bd467aa920ae09b14683f5da72892856cfc01138dbc296","last_reissued_at":"2026-05-20T00:02:57.585729Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:02:57.585729Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2510.16416","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:02:57Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kI50V36F6Ox6nJmuBcPa+NwQZOMGjj2JCD4AOOYVQIq98jYlVrMZSLDY8K5ySO7LDfOwP/DBWLvNmCeVlRgSBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T13:15:42.686570Z"},"content_sha256":"9f2f37db2460273b28f2cd22c20cccd56799751dd6036d40ab4e24bc600a6827","schema_version":"1.0","event_id":"sha256:9f2f37db2460273b28f2cd22c20cccd56799751dd6036d40ab4e24bc600a6827"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:URTZ6GV2WY2JL4N5IZ5KSIFOBG","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"SSL4RL: Revisiting Self-supervised Learning as Intrinsic Reward for Visual-Language Reasoning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CV","authors_text":"Chenheng Zhang, Guojun Yin, Jiajun Chai, Qi Zhang, Runyu Zhou, Stefanie Jegelka, Wei Lin, Xiaohan Wang, Xiaojun Guo, Yifei Wang, Yisen Wang","submitted_at":"2025-10-18T09:22:40Z","abstract_excerpt":"Vision-language models (VLMs) have shown remarkable abilities by integrating large language models with visual inputs. However, they often fail to utilize visual evidence adequately, either depending on linguistic priors in vision-centric tasks or resorting to textual shortcuts during reasoning. Although reinforcement learning (RL) can align models with desired behaviors, its application to VLMs has been hindered by the lack of scalable and reliable reward mechanisms. To overcome this challenge, we propose SSL4RL, a novel framework that leverages self-supervised learning (SSL) tasks as a sourc"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.16416","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2510.16416/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:02:57Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sKInQlgLomwHefhwerVFi+xtcjRKu5lO55Zg6f+7DBPXoUPjZKCOyV7Z+1iLmIbI6dTlgg9FXCdE45k/ZEEKDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T13:15:42.687266Z"},"content_sha256":"a488497dd0f1d8c6d1e6f4fedd98436be71d728191804af07d5cf9b5144e19a1","schema_version":"1.0","event_id":"sha256:a488497dd0f1d8c6d1e6f4fedd98436be71d728191804af07d5cf9b5144e19a1"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/URTZ6GV2WY2JL4N5IZ5KSIFOBG/bundle.json","state_url":"https://pith.science/pith/URTZ6GV2WY2JL4N5IZ5KSIFOBG/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/URTZ6GV2WY2JL4N5IZ5KSIFOBG/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-22T13:15:42Z","links":{"resolver":"https://pith.science/pith/URTZ6GV2WY2JL4N5IZ5KSIFOBG","bundle":"https://pith.science/pith/URTZ6GV2WY2JL4N5IZ5KSIFOBG/bundle.json","state":"https://pith.science/pith/URTZ6GV2WY2JL4N5IZ5KSIFOBG/state.json","well_known_bundle":"https://pith.science/.well-known/pith/URTZ6GV2WY2JL4N5IZ5KSIFOBG/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:URTZ6GV2WY2JL4N5IZ5KSIFOBG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4eda7f472ee1c0deba60cd9e9c02f998a989a7d8aa3519a97067320ebe99f022","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-18T09:22:40Z","title_canon_sha256":"dc4a5f9a2c4244bbfc8a2d4f13edbd3a2859d918b730aa5d900a6c0d2994b153"},"schema_version":"1.0","source":{"id":"2510.16416","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2510.16416","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"arxiv_version","alias_value":"2510.16416v4","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.16416","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"pith_short_12","alias_value":"URTZ6GV2WY2J","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"pith_short_16","alias_value":"URTZ6GV2WY2JL4N5","created_at":"2026-05-20T00:02:57Z"},{"alias_kind":"pith_short_8","alias_value":"URTZ6GV2","created_at":"2026-05-20T00:02:57Z"}],"graph_snapshots":[{"event_id":"sha256:a488497dd0f1d8c6d1e6f4fedd98436be71d728191804af07d5cf9b5144e19a1","target":"graph","created_at":"2026-05-20T00:02:57Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2510.16416/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Vision-language models (VLMs) have shown remarkable abilities by integrating large language models with visual inputs. However, they often fail to utilize visual evidence adequately, either depending on linguistic priors in vision-centric tasks or resorting to textual shortcuts during reasoning. Although reinforcement learning (RL) can align models with desired behaviors, its application to VLMs has been hindered by the lack of scalable and reliable reward mechanisms. To overcome this challenge, we propose SSL4RL, a novel framework that leverages self-supervised learning (SSL) tasks as a sourc","authors_text":"Chenheng Zhang, Guojun Yin, Jiajun Chai, Qi Zhang, Runyu Zhou, Stefanie Jegelka, Wei Lin, Xiaohan Wang, Xiaojun Guo, Yifei Wang, Yisen Wang","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-18T09:22:40Z","title":"SSL4RL: Revisiting Self-supervised Learning as Intrinsic Reward for Visual-Language Reasoning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.16416","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9f2f37db2460273b28f2cd22c20cccd56799751dd6036d40ab4e24bc600a6827","target":"record","created_at":"2026-05-20T00:02:57Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4eda7f472ee1c0deba60cd9e9c02f998a989a7d8aa3519a97067320ebe99f022","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2025-10-18T09:22:40Z","title_canon_sha256":"dc4a5f9a2c4244bbfc8a2d4f13edbd3a2859d918b730aa5d900a6c0d2994b153"},"schema_version":"1.0","source":{"id":"2510.16416","kind":"arxiv","version":4}},"canonical_sha256":"a4679f1abab63495f1bd467aa920ae09b14683f5da72892856cfc01138dbc296","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a4679f1abab63495f1bd467aa920ae09b14683f5da72892856cfc01138dbc296","first_computed_at":"2026-05-20T00:02:57.585729Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:02:57.585729Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"W8C0h3IhBTSWmkosnucV6M4uLof2ZkBN41dId3DpUE/8s0dQGhCh1FAD+NwlNQCsR3zn/zTE/Q5EKUmNCpUoCg==","signature_status":"signed_v1","signed_at":"2026-05-20T00:02:57.586549Z","signed_message":"canonical_sha256_bytes"},"source_id":"2510.16416","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9f2f37db2460273b28f2cd22c20cccd56799751dd6036d40ab4e24bc600a6827","sha256:a488497dd0f1d8c6d1e6f4fedd98436be71d728191804af07d5cf9b5144e19a1"],"state_sha256":"60a349fb0748f41c67109c775153506fc585acaf1114747b4c52b78c119b1807"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"fJuQnjW3vBP+6Zwa0hF/KWx82ColpHWPTrlIZ5NER6ndRMg+9AewdCLtA8YpChgtn7uZSE/ReI8w+aqs7VyMBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-22T13:15:42.690892Z","bundle_sha256":"5dd940dfcd949791e0a9db0c7ccc6237de603051ed39642ccf70aa9c8f426535"}}