{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:3LCP4KS3COZVR5SCQFVS4U5E5R","short_pith_number":"pith:3LCP4KS3","canonical_record":{"source":{"id":"2606.06819","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-05T01:44:38Z","cross_cats_sorted":[],"title_canon_sha256":"732b326777bd1e9bffee539a290bfb6b919c8c16d110634e4d9e6ce46b579abc","abstract_canon_sha256":"d0805f6edd2541a4a5b621e1d70498fd07a43471a7b3635870b979300524e772"},"schema_version":"1.0"},"canonical_sha256":"dac4fe2a5b13b358f642816b2e53a4ec7e75f122a298a087555a53bd42fff984","source":{"kind":"arxiv","id":"2606.06819","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.06819","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"arxiv_version","alias_value":"2606.06819v1","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.06819","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"pith_short_12","alias_value":"3LCP4KS3COZV","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"pith_short_16","alias_value":"3LCP4KS3COZVR5SC","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"pith_short_8","alias_value":"3LCP4KS3","created_at":"2026-06-08T01:04:29Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:3LCP4KS3COZVR5SCQFVS4U5E5R","target":"record","payload":{"canonical_record":{"source":{"id":"2606.06819","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-05T01:44:38Z","cross_cats_sorted":[],"title_canon_sha256":"732b326777bd1e9bffee539a290bfb6b919c8c16d110634e4d9e6ce46b579abc","abstract_canon_sha256":"d0805f6edd2541a4a5b621e1d70498fd07a43471a7b3635870b979300524e772"},"schema_version":"1.0"},"canonical_sha256":"dac4fe2a5b13b358f642816b2e53a4ec7e75f122a298a087555a53bd42fff984","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-08T01:04:29.815513Z","signature_b64":"O8ef7y2kzgP2IBIMeld6/QPcdANtbv4P/IOPeyZMd43oD/ZZvZ8ycTGvRfXJdFxbrP6qftV5AN47igw8YJ5yBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"dac4fe2a5b13b358f642816b2e53a4ec7e75f122a298a087555a53bd42fff984","last_reissued_at":"2026-06-08T01:04:29.814680Z","signature_status":"signed_v1","first_computed_at":"2026-06-08T01:04:29.814680Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.06819","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-08T01:04:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7JjTkB+1l9RKXY21TIVwPxprW3JZsPqv2dasbZLwAbZ8gGi56fw5LrGwmgszwTUzI/5tlC1k0jrFYMY9fjEwBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T21:01:17.041675Z"},"content_sha256":"fc2b92144c4492042e20aa05479e4d7da65eb95cbb74a3bdb684a307ec080ebc","schema_version":"1.0","event_id":"sha256:fc2b92144c4492042e20aa05479e4d7da65eb95cbb74a3bdb684a307ec080ebc"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:3LCP4KS3COZVR5SCQFVS4U5E5R","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"VideoSEG-O3: A Multi-turn Reinforcement Learning Framework for Reasoning Video Object Segmentation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Boqiang Duan, Boyuan Tong, Jiedong Zhuang, Jingdong Wang, Ming Dai, Sen Yang, Wankou Yang","submitted_at":"2026-06-05T01:44:38Z","abstract_excerpt":"Reasoning Video Object Segmentation (RVOS) demands a sophisticated integration of temporal dynamics, spatial details, and linguistic reasoning to achieve precise pixel-level localization. Existing methods are limited to reasoning over fixed initial inputs and lack the capacity to actively acquire further visual evidence, which is often essential for resolving complex references in long or intricate videos. To address this, we propose \\textbf{VideoSEG-O3}, the first multi-turn reinforcement learning framework for RVOS that emulates the human \\textit{``coarse-to-fine''} cognitive process. It emp"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.06819","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.06819/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-08T01:04:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FmQN9EdYrIGR2BlXW0fKErhPRVkuMM8KnZVQDaH1X3Kf1Y+7Zkpk4v3U1S5NcqRMUv0JmoEse1mPO7lgr/hFDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-30T21:01:17.042061Z"},"content_sha256":"a0b08aba6975dc0dcea183d1805df794f9212e9fda8d45df55329c227917ca45","schema_version":"1.0","event_id":"sha256:a0b08aba6975dc0dcea183d1805df794f9212e9fda8d45df55329c227917ca45"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3LCP4KS3COZVR5SCQFVS4U5E5R/bundle.json","state_url":"https://pith.science/pith/3LCP4KS3COZVR5SCQFVS4U5E5R/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3LCP4KS3COZVR5SCQFVS4U5E5R/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-30T21:01:17Z","links":{"resolver":"https://pith.science/pith/3LCP4KS3COZVR5SCQFVS4U5E5R","bundle":"https://pith.science/pith/3LCP4KS3COZVR5SCQFVS4U5E5R/bundle.json","state":"https://pith.science/pith/3LCP4KS3COZVR5SCQFVS4U5E5R/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3LCP4KS3COZVR5SCQFVS4U5E5R/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:3LCP4KS3COZVR5SCQFVS4U5E5R","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d0805f6edd2541a4a5b621e1d70498fd07a43471a7b3635870b979300524e772","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-05T01:44:38Z","title_canon_sha256":"732b326777bd1e9bffee539a290bfb6b919c8c16d110634e4d9e6ce46b579abc"},"schema_version":"1.0","source":{"id":"2606.06819","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.06819","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"arxiv_version","alias_value":"2606.06819v1","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.06819","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"pith_short_12","alias_value":"3LCP4KS3COZV","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"pith_short_16","alias_value":"3LCP4KS3COZVR5SC","created_at":"2026-06-08T01:04:29Z"},{"alias_kind":"pith_short_8","alias_value":"3LCP4KS3","created_at":"2026-06-08T01:04:29Z"}],"graph_snapshots":[{"event_id":"sha256:a0b08aba6975dc0dcea183d1805df794f9212e9fda8d45df55329c227917ca45","target":"graph","created_at":"2026-06-08T01:04:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.06819/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reasoning Video Object Segmentation (RVOS) demands a sophisticated integration of temporal dynamics, spatial details, and linguistic reasoning to achieve precise pixel-level localization. Existing methods are limited to reasoning over fixed initial inputs and lack the capacity to actively acquire further visual evidence, which is often essential for resolving complex references in long or intricate videos. To address this, we propose \\textbf{VideoSEG-O3}, the first multi-turn reinforcement learning framework for RVOS that emulates the human \\textit{``coarse-to-fine''} cognitive process. It emp","authors_text":"Boqiang Duan, Boyuan Tong, Jiedong Zhuang, Jingdong Wang, Ming Dai, Sen Yang, Wankou Yang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-05T01:44:38Z","title":"VideoSEG-O3: A Multi-turn Reinforcement Learning Framework for Reasoning Video Object Segmentation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.06819","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fc2b92144c4492042e20aa05479e4d7da65eb95cbb74a3bdb684a307ec080ebc","target":"record","created_at":"2026-06-08T01:04:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d0805f6edd2541a4a5b621e1d70498fd07a43471a7b3635870b979300524e772","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-05T01:44:38Z","title_canon_sha256":"732b326777bd1e9bffee539a290bfb6b919c8c16d110634e4d9e6ce46b579abc"},"schema_version":"1.0","source":{"id":"2606.06819","kind":"arxiv","version":1}},"canonical_sha256":"dac4fe2a5b13b358f642816b2e53a4ec7e75f122a298a087555a53bd42fff984","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"dac4fe2a5b13b358f642816b2e53a4ec7e75f122a298a087555a53bd42fff984","first_computed_at":"2026-06-08T01:04:29.814680Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-08T01:04:29.814680Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"O8ef7y2kzgP2IBIMeld6/QPcdANtbv4P/IOPeyZMd43oD/ZZvZ8ycTGvRfXJdFxbrP6qftV5AN47igw8YJ5yBg==","signature_status":"signed_v1","signed_at":"2026-06-08T01:04:29.815513Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.06819","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fc2b92144c4492042e20aa05479e4d7da65eb95cbb74a3bdb684a307ec080ebc","sha256:a0b08aba6975dc0dcea183d1805df794f9212e9fda8d45df55329c227917ca45"],"state_sha256":"53ecd80c101270848afcb26b6734fd5c2f38943d64f5bcf20423c8f7407df88d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Gw+h0G3fX6y3Vi/zvBF0wEeZLaALTGZ448K5lHhInx9FLJi2RneViLX+2NAfie78ynrY2xmpWTbIoP2rqW33CQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-30T21:01:17.044196Z","bundle_sha256":"c6f18006cecf5197927676696293235dd0f57250362cd7600ce00ee9975c7ab7"}}