{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:2WN3GPRCKQ2TMBKQ64TBJAFVOJ","short_pith_number":"pith:2WN3GPRC","canonical_record":{"source":{"id":"2605.29416","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-28T06:07:57Z","cross_cats_sorted":["cs.CV"],"title_canon_sha256":"24cf268ec1f39f0bbd4b5cdf2214d039f5a73c7a42c48a54b2c58b4d89ec70c0","abstract_canon_sha256":"d26258d6ba15aef4cdd69b7ee653a44f01e12be94ca91a0b30af7e4cc4325e25"},"schema_version":"1.0"},"canonical_sha256":"d59bb33e225435360550f7261480b5725e4bfd3bf18888ca48694a4efcfa2cf4","source":{"kind":"arxiv","id":"2605.29416","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.29416","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"arxiv_version","alias_value":"2605.29416v1","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.29416","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"pith_short_12","alias_value":"2WN3GPRCKQ2T","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"pith_short_16","alias_value":"2WN3GPRCKQ2TMBKQ","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"pith_short_8","alias_value":"2WN3GPRC","created_at":"2026-05-29T01:05:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:2WN3GPRCKQ2TMBKQ64TBJAFVOJ","target":"record","payload":{"canonical_record":{"source":{"id":"2605.29416","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-28T06:07:57Z","cross_cats_sorted":["cs.CV"],"title_canon_sha256":"24cf268ec1f39f0bbd4b5cdf2214d039f5a73c7a42c48a54b2c58b4d89ec70c0","abstract_canon_sha256":"d26258d6ba15aef4cdd69b7ee653a44f01e12be94ca91a0b30af7e4cc4325e25"},"schema_version":"1.0"},"canonical_sha256":"d59bb33e225435360550f7261480b5725e4bfd3bf18888ca48694a4efcfa2cf4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T01:05:37.730248Z","signature_b64":"js6D2XWxoHo81b+Wii6yOrYH4IaqLGZtSR8IBMqRxeabgcNcx/y76NB1K4nGQxZVV2PcJIfojKJWORK6bV7WBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d59bb33e225435360550f7261480b5725e4bfd3bf18888ca48694a4efcfa2cf4","last_reissued_at":"2026-05-29T01:05:37.729756Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T01:05:37.729756Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.29416","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G/9GVhB0cSLHu8EaDuZYVFBMiPJheCs4KFn+ivmG9TimV9kY8Cqa4iQ1Saxpy9SQHMsBGqJPHL+18npRZn+vDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T15:11:59.515250Z"},"content_sha256":"5186ac1fe0e9e8bbc61cab23c47f243bec14dc89b881fbd87927f7a9904921ba","schema_version":"1.0","event_id":"sha256:5186ac1fe0e9e8bbc61cab23c47f243bec14dc89b881fbd87927f7a9904921ba"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:2WN3GPRCKQ2TMBKQ64TBJAFVOJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"3DVLA: Enhancing Vision-Language-Action Models via 3D Spatial and Instance Understanding","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.CV"],"primary_cat":"cs.RO","authors_text":"Bingqing Wei, Yongtao Wang, Yousen Tang, Zhongyu Xia","submitted_at":"2026-05-28T06:07:57Z","abstract_excerpt":"Vision-Language-Action models have achieved remarkable progress in robotic manipulation, yet they suffer from a critical limitation: a lack of 3D scene understanding. This deficiency manifests as three intertwined challenges: weak extraction of 3D spatial positions without enforcing multi-view consistency, inadequate 3D instance understanding, and fragile reasoning under occlusion. Although mature 3D perception methods exist, their direct integration into VLA pipelines is hindered by architectural incompatibility and by heavy reliance on costly instance-level annotations. To address the above "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.29416","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.29416/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T01:05:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"TQCWyvaNBJ2BPHL3vod8jdFJf0/poLuenRLLv59VV/gBcKZwWF1zU9So0d7G6IqIv4henZRq9Jx829aW1mUUBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T15:11:59.515912Z"},"content_sha256":"fdc15ea338e06e92e1a9e143bf7248e6af9d0a628443b113002f8bfc936d9b37","schema_version":"1.0","event_id":"sha256:fdc15ea338e06e92e1a9e143bf7248e6af9d0a628443b113002f8bfc936d9b37"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/2WN3GPRCKQ2TMBKQ64TBJAFVOJ/bundle.json","state_url":"https://pith.science/pith/2WN3GPRCKQ2TMBKQ64TBJAFVOJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/2WN3GPRCKQ2TMBKQ64TBJAFVOJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T15:11:59Z","links":{"resolver":"https://pith.science/pith/2WN3GPRCKQ2TMBKQ64TBJAFVOJ","bundle":"https://pith.science/pith/2WN3GPRCKQ2TMBKQ64TBJAFVOJ/bundle.json","state":"https://pith.science/pith/2WN3GPRCKQ2TMBKQ64TBJAFVOJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/2WN3GPRCKQ2TMBKQ64TBJAFVOJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:2WN3GPRCKQ2TMBKQ64TBJAFVOJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d26258d6ba15aef4cdd69b7ee653a44f01e12be94ca91a0b30af7e4cc4325e25","cross_cats_sorted":["cs.CV"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-28T06:07:57Z","title_canon_sha256":"24cf268ec1f39f0bbd4b5cdf2214d039f5a73c7a42c48a54b2c58b4d89ec70c0"},"schema_version":"1.0","source":{"id":"2605.29416","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.29416","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"arxiv_version","alias_value":"2605.29416v1","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.29416","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"pith_short_12","alias_value":"2WN3GPRCKQ2T","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"pith_short_16","alias_value":"2WN3GPRCKQ2TMBKQ","created_at":"2026-05-29T01:05:37Z"},{"alias_kind":"pith_short_8","alias_value":"2WN3GPRC","created_at":"2026-05-29T01:05:37Z"}],"graph_snapshots":[{"event_id":"sha256:fdc15ea338e06e92e1a9e143bf7248e6af9d0a628443b113002f8bfc936d9b37","target":"graph","created_at":"2026-05-29T01:05:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.29416/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Vision-Language-Action models have achieved remarkable progress in robotic manipulation, yet they suffer from a critical limitation: a lack of 3D scene understanding. This deficiency manifests as three intertwined challenges: weak extraction of 3D spatial positions without enforcing multi-view consistency, inadequate 3D instance understanding, and fragile reasoning under occlusion. Although mature 3D perception methods exist, their direct integration into VLA pipelines is hindered by architectural incompatibility and by heavy reliance on costly instance-level annotations. To address the above ","authors_text":"Bingqing Wei, Yongtao Wang, Yousen Tang, Zhongyu Xia","cross_cats":["cs.CV"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-28T06:07:57Z","title":"3DVLA: Enhancing Vision-Language-Action Models via 3D Spatial and Instance Understanding"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.29416","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5186ac1fe0e9e8bbc61cab23c47f243bec14dc89b881fbd87927f7a9904921ba","target":"record","created_at":"2026-05-29T01:05:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d26258d6ba15aef4cdd69b7ee653a44f01e12be94ca91a0b30af7e4cc4325e25","cross_cats_sorted":["cs.CV"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-28T06:07:57Z","title_canon_sha256":"24cf268ec1f39f0bbd4b5cdf2214d039f5a73c7a42c48a54b2c58b4d89ec70c0"},"schema_version":"1.0","source":{"id":"2605.29416","kind":"arxiv","version":1}},"canonical_sha256":"d59bb33e225435360550f7261480b5725e4bfd3bf18888ca48694a4efcfa2cf4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d59bb33e225435360550f7261480b5725e4bfd3bf18888ca48694a4efcfa2cf4","first_computed_at":"2026-05-29T01:05:37.729756Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T01:05:37.729756Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"js6D2XWxoHo81b+Wii6yOrYH4IaqLGZtSR8IBMqRxeabgcNcx/y76NB1K4nGQxZVV2PcJIfojKJWORK6bV7WBg==","signature_status":"signed_v1","signed_at":"2026-05-29T01:05:37.730248Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.29416","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5186ac1fe0e9e8bbc61cab23c47f243bec14dc89b881fbd87927f7a9904921ba","sha256:fdc15ea338e06e92e1a9e143bf7248e6af9d0a628443b113002f8bfc936d9b37"],"state_sha256":"44141037dfb53d296ea5fce3d48258685b2ed41035df54f07538e70fc53b0388"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"U+CEgQbcSuUU+cjYv4BG1kTpw176EMeQPe2+lOVmkXdBqJmqaFsHboRTIPMkrEVZMk5P8bzaq6rucnYnGYcPAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T15:11:59.518322Z","bundle_sha256":"1f21f975e1fa013d67371ef07b3c1676813487d5a6946c26d29a6549f07af69c"}}