{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:CG6LJ435QCNTHCACFR2SZZKLUC","short_pith_number":"pith:CG6LJ435","canonical_record":{"source":{"id":"2606.00564","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-30T06:34:37Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"84fe8c9faf53448966d47f07040c85be892ab2779048a7b267176539289fd0b0","abstract_canon_sha256":"26ada1e71a9fbf4b073b929c5184cbd08b2d44e318293290ee41515044d0c4d4"},"schema_version":"1.0"},"canonical_sha256":"11bcb4f37d809b3388022c752ce54ba0beaa545d3414383e546eddebb37c20fd","source":{"kind":"arxiv","id":"2606.00564","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00564","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00564v1","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00564","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"pith_short_12","alias_value":"CG6LJ435QCNT","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"pith_short_16","alias_value":"CG6LJ435QCNTHCAC","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"pith_short_8","alias_value":"CG6LJ435","created_at":"2026-06-02T01:03:58Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:CG6LJ435QCNTHCACFR2SZZKLUC","target":"record","payload":{"canonical_record":{"source":{"id":"2606.00564","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-30T06:34:37Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"84fe8c9faf53448966d47f07040c85be892ab2779048a7b267176539289fd0b0","abstract_canon_sha256":"26ada1e71a9fbf4b073b929c5184cbd08b2d44e318293290ee41515044d0c4d4"},"schema_version":"1.0"},"canonical_sha256":"11bcb4f37d809b3388022c752ce54ba0beaa545d3414383e546eddebb37c20fd","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T01:03:58.407523Z","signature_b64":"Ny+vcSyMiVjYy+kVHdUIL/sGBPO9SpcE9rVBjcHZZt8ZrceiZ46/Kuzn+ntaIZejFWbKzddBtpn8HOJOEASlDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"11bcb4f37d809b3388022c752ce54ba0beaa545d3414383e546eddebb37c20fd","last_reissued_at":"2026-06-02T01:03:58.407096Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T01:03:58.407096Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.00564","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T01:03:58Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ko7qyEEUcMcDEyor890EpOU0KRs7aZUDK8GVOA5MXrKCibRKSoUpP6bf5ZzbdMrStOCoQzQbYVe4KJveaVXECg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T16:54:38.389876Z"},"content_sha256":"b28fd8c8f6fe30fad1a896d6d855b0ea7e18a95a43a233bfc9a4dc6519f51400","schema_version":"1.0","event_id":"sha256:b28fd8c8f6fe30fad1a896d6d855b0ea7e18a95a43a233bfc9a4dc6519f51400"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:CG6LJ435QCNTHCACFR2SZZKLUC","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Decomposed On-Policy Distillation for Vision-Language Reasoning: Steering Gradients for Visual Grounding","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"cs.CV","authors_text":"Chang D. Yoo, Chong Luo, Eunseop Yoon, Hee Suk Yoon, Jaehyun Jang, Ji Woo Hong, Mark Hasegawa-Johnson, Qi Dai, SooHwan Eom","submitted_at":"2026-05-30T06:34:37Z","abstract_excerpt":"While on-policy distillation offers dense supervision for training small reasoning models, its optimization dynamics in the multimodal domain remain under-explored. In this work, we challenge the standard monolithic view of Vision-Language Model (VLM) distillation by mathematically decomposing the loss into two distinct components: the language prior and visual grounding. Our analysis uncovers that gradient vectors for these components are nearly orthogonal, indicating that the objective of aligning with the teacher's language distribution is geometrically independent from the objective of mat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00564","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.00564/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T01:03:58Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Kgvn/XZnxe/MjOXdB/XNVi+ElTPnkdWOV24OjRBZDCSXsVsbuud+tzMs/l6BveieIPfbeLo4c/rDo1RulT2AAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T16:54:38.390254Z"},"content_sha256":"549fc1835d0fb48406b55d4293e9b9a609d8e55eda0a33d9bfb4638b43c91b36","schema_version":"1.0","event_id":"sha256:549fc1835d0fb48406b55d4293e9b9a609d8e55eda0a33d9bfb4638b43c91b36"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CG6LJ435QCNTHCACFR2SZZKLUC/bundle.json","state_url":"https://pith.science/pith/CG6LJ435QCNTHCACFR2SZZKLUC/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CG6LJ435QCNTHCACFR2SZZKLUC/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T16:54:38Z","links":{"resolver":"https://pith.science/pith/CG6LJ435QCNTHCACFR2SZZKLUC","bundle":"https://pith.science/pith/CG6LJ435QCNTHCACFR2SZZKLUC/bundle.json","state":"https://pith.science/pith/CG6LJ435QCNTHCACFR2SZZKLUC/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CG6LJ435QCNTHCACFR2SZZKLUC/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:CG6LJ435QCNTHCACFR2SZZKLUC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"26ada1e71a9fbf4b073b929c5184cbd08b2d44e318293290ee41515044d0c4d4","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-30T06:34:37Z","title_canon_sha256":"84fe8c9faf53448966d47f07040c85be892ab2779048a7b267176539289fd0b0"},"schema_version":"1.0","source":{"id":"2606.00564","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00564","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00564v1","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00564","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"pith_short_12","alias_value":"CG6LJ435QCNT","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"pith_short_16","alias_value":"CG6LJ435QCNTHCAC","created_at":"2026-06-02T01:03:58Z"},{"alias_kind":"pith_short_8","alias_value":"CG6LJ435","created_at":"2026-06-02T01:03:58Z"}],"graph_snapshots":[{"event_id":"sha256:549fc1835d0fb48406b55d4293e9b9a609d8e55eda0a33d9bfb4638b43c91b36","target":"graph","created_at":"2026-06-02T01:03:58Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.00564/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"While on-policy distillation offers dense supervision for training small reasoning models, its optimization dynamics in the multimodal domain remain under-explored. In this work, we challenge the standard monolithic view of Vision-Language Model (VLM) distillation by mathematically decomposing the loss into two distinct components: the language prior and visual grounding. Our analysis uncovers that gradient vectors for these components are nearly orthogonal, indicating that the objective of aligning with the teacher's language distribution is geometrically independent from the objective of mat","authors_text":"Chang D. Yoo, Chong Luo, Eunseop Yoon, Hee Suk Yoon, Jaehyun Jang, Ji Woo Hong, Mark Hasegawa-Johnson, Qi Dai, SooHwan Eom","cross_cats":["cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-30T06:34:37Z","title":"Decomposed On-Policy Distillation for Vision-Language Reasoning: Steering Gradients for Visual Grounding"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00564","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b28fd8c8f6fe30fad1a896d6d855b0ea7e18a95a43a233bfc9a4dc6519f51400","target":"record","created_at":"2026-06-02T01:03:58Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"26ada1e71a9fbf4b073b929c5184cbd08b2d44e318293290ee41515044d0c4d4","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-30T06:34:37Z","title_canon_sha256":"84fe8c9faf53448966d47f07040c85be892ab2779048a7b267176539289fd0b0"},"schema_version":"1.0","source":{"id":"2606.00564","kind":"arxiv","version":1}},"canonical_sha256":"11bcb4f37d809b3388022c752ce54ba0beaa545d3414383e546eddebb37c20fd","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"11bcb4f37d809b3388022c752ce54ba0beaa545d3414383e546eddebb37c20fd","first_computed_at":"2026-06-02T01:03:58.407096Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T01:03:58.407096Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Ny+vcSyMiVjYy+kVHdUIL/sGBPO9SpcE9rVBjcHZZt8ZrceiZ46/Kuzn+ntaIZejFWbKzddBtpn8HOJOEASlDw==","signature_status":"signed_v1","signed_at":"2026-06-02T01:03:58.407523Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.00564","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b28fd8c8f6fe30fad1a896d6d855b0ea7e18a95a43a233bfc9a4dc6519f51400","sha256:549fc1835d0fb48406b55d4293e9b9a609d8e55eda0a33d9bfb4638b43c91b36"],"state_sha256":"cca4459bc44fdc7de0b3bc4ee793fe0ed39e03ffb88495ed8125f42dcd51cc76"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"GnSqW1t+Hdvb+io9ClLZhpDsDFx17YareYMJsO+HojnSY52356e3hQlcCJxDY9I9DjSMXmczsOtbcaKOqf0HDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T16:54:38.392606Z","bundle_sha256":"86b84a45e53f821863460addb21ceeeb7d7b51948753c5163970c8640a51b2df"}}