{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:2Z6UCPVSXLBIATCRDYUJ2ETOA3","short_pith_number":"pith:2Z6UCPVS","canonical_record":{"source":{"id":"2606.11568","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T01:49:55Z","cross_cats_sorted":[],"title_canon_sha256":"ff50ef8022965e69a7cba7a11939ebc166fefeefb424d8795f808f92f7434faa","abstract_canon_sha256":"e2e0af1c434725c036edd0a25c63f7bf137f952977115ef4629ad95949a80718"},"schema_version":"1.0"},"canonical_sha256":"d67d413eb2bac2804c511e289d126e06c209934be4d7d8befbc95ab77737cafa","source":{"kind":"arxiv","id":"2606.11568","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.11568","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"arxiv_version","alias_value":"2606.11568v1","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.11568","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"pith_short_12","alias_value":"2Z6UCPVSXLBI","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"pith_short_16","alias_value":"2Z6UCPVSXLBIATCR","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"pith_short_8","alias_value":"2Z6UCPVS","created_at":"2026-06-11T01:09:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:2Z6UCPVSXLBIATCRDYUJ2ETOA3","target":"record","payload":{"canonical_record":{"source":{"id":"2606.11568","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T01:49:55Z","cross_cats_sorted":[],"title_canon_sha256":"ff50ef8022965e69a7cba7a11939ebc166fefeefb424d8795f808f92f7434faa","abstract_canon_sha256":"e2e0af1c434725c036edd0a25c63f7bf137f952977115ef4629ad95949a80718"},"schema_version":"1.0"},"canonical_sha256":"d67d413eb2bac2804c511e289d126e06c209934be4d7d8befbc95ab77737cafa","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-11T01:09:56.583350Z","signature_b64":"0Y0KEcLis6qFAmQrLKcg/BLB6SbYHDLP5E6X5QWwC4XB2tfgK8a/ZTTCOAhwXKzuBGkr/bDbSIXPf7bPqOZOCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d67d413eb2bac2804c511e289d126e06c209934be4d7d8befbc95ab77737cafa","last_reissued_at":"2026-06-11T01:09:56.582478Z","signature_status":"signed_v1","first_computed_at":"2026-06-11T01:09:56.582478Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.11568","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-11T01:09:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"38EheFrJZjnobP7nJp4LpEHuLAGoYfSMpTJFQvlYOZu0QOmYEiddKaa4MXu8lYc1brOun/ItCVIxQj5FCWEnDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T01:36:15.813051Z"},"content_sha256":"dd7e24c10a5b8af01b7c132ffaf6c1febd95d79c5cd83f2b5f35c03d130a1795","schema_version":"1.0","event_id":"sha256:dd7e24c10a5b8af01b7c132ffaf6c1febd95d79c5cd83f2b5f35c03d130a1795"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:2Z6UCPVSXLBIATCRDYUJ2ETOA3","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"4DP-QA: Scalable QA for 4D Perception in Vision Language Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Abhishek Badki, Hang Su, Jindong Jiang, Orazio Gallo, Seokju Cho, Seungryong Kim, Sifei Liu, Ziyao Zeng","submitted_at":"2026-06-10T01:49:55Z","abstract_excerpt":"Despite recent advances, Vision Language Models (VLMs) still struggle to grasp the dynamics of the world. We note that the ability to reason about a 4D scene, challenging in itself, is further complicated by two factors. First, VLMs observe motion indirectly via its projection onto 2D images. Second, existing datasets fail to disentangle object and camera motion. To address these challenges, we present a QA generation pipeline that focuses on motion-related scene understanding. We take particular care of the entanglement of camera and object motion by casting tracking in both the traditional w"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.11568","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.11568/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-11T01:09:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Rgje7J3a92vWt/rg7V5l912k70Lvrfim/raGnUYCjvSo4JVMQEk3IMXUxFyN5nYiPQU6fMHWqKl1kv0siAP0Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T01:36:15.813437Z"},"content_sha256":"d302aacab6942bd053f6c86a378d7300744bade4ea917ee0455f09a35bd498ac","schema_version":"1.0","event_id":"sha256:d302aacab6942bd053f6c86a378d7300744bade4ea917ee0455f09a35bd498ac"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/2Z6UCPVSXLBIATCRDYUJ2ETOA3/bundle.json","state_url":"https://pith.science/pith/2Z6UCPVSXLBIATCRDYUJ2ETOA3/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/2Z6UCPVSXLBIATCRDYUJ2ETOA3/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T01:36:15Z","links":{"resolver":"https://pith.science/pith/2Z6UCPVSXLBIATCRDYUJ2ETOA3","bundle":"https://pith.science/pith/2Z6UCPVSXLBIATCRDYUJ2ETOA3/bundle.json","state":"https://pith.science/pith/2Z6UCPVSXLBIATCRDYUJ2ETOA3/state.json","well_known_bundle":"https://pith.science/.well-known/pith/2Z6UCPVSXLBIATCRDYUJ2ETOA3/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:2Z6UCPVSXLBIATCRDYUJ2ETOA3","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e2e0af1c434725c036edd0a25c63f7bf137f952977115ef4629ad95949a80718","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T01:49:55Z","title_canon_sha256":"ff50ef8022965e69a7cba7a11939ebc166fefeefb424d8795f808f92f7434faa"},"schema_version":"1.0","source":{"id":"2606.11568","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.11568","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"arxiv_version","alias_value":"2606.11568v1","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.11568","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"pith_short_12","alias_value":"2Z6UCPVSXLBI","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"pith_short_16","alias_value":"2Z6UCPVSXLBIATCR","created_at":"2026-06-11T01:09:56Z"},{"alias_kind":"pith_short_8","alias_value":"2Z6UCPVS","created_at":"2026-06-11T01:09:56Z"}],"graph_snapshots":[{"event_id":"sha256:d302aacab6942bd053f6c86a378d7300744bade4ea917ee0455f09a35bd498ac","target":"graph","created_at":"2026-06-11T01:09:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.11568/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Despite recent advances, Vision Language Models (VLMs) still struggle to grasp the dynamics of the world. We note that the ability to reason about a 4D scene, challenging in itself, is further complicated by two factors. First, VLMs observe motion indirectly via its projection onto 2D images. Second, existing datasets fail to disentangle object and camera motion. To address these challenges, we present a QA generation pipeline that focuses on motion-related scene understanding. We take particular care of the entanglement of camera and object motion by casting tracking in both the traditional w","authors_text":"Abhishek Badki, Hang Su, Jindong Jiang, Orazio Gallo, Seokju Cho, Seungryong Kim, Sifei Liu, Ziyao Zeng","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T01:49:55Z","title":"4DP-QA: Scalable QA for 4D Perception in Vision Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.11568","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:dd7e24c10a5b8af01b7c132ffaf6c1febd95d79c5cd83f2b5f35c03d130a1795","target":"record","created_at":"2026-06-11T01:09:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e2e0af1c434725c036edd0a25c63f7bf137f952977115ef4629ad95949a80718","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-10T01:49:55Z","title_canon_sha256":"ff50ef8022965e69a7cba7a11939ebc166fefeefb424d8795f808f92f7434faa"},"schema_version":"1.0","source":{"id":"2606.11568","kind":"arxiv","version":1}},"canonical_sha256":"d67d413eb2bac2804c511e289d126e06c209934be4d7d8befbc95ab77737cafa","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d67d413eb2bac2804c511e289d126e06c209934be4d7d8befbc95ab77737cafa","first_computed_at":"2026-06-11T01:09:56.582478Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-11T01:09:56.582478Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"0Y0KEcLis6qFAmQrLKcg/BLB6SbYHDLP5E6X5QWwC4XB2tfgK8a/ZTTCOAhwXKzuBGkr/bDbSIXPf7bPqOZOCA==","signature_status":"signed_v1","signed_at":"2026-06-11T01:09:56.583350Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.11568","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:dd7e24c10a5b8af01b7c132ffaf6c1febd95d79c5cd83f2b5f35c03d130a1795","sha256:d302aacab6942bd053f6c86a378d7300744bade4ea917ee0455f09a35bd498ac"],"state_sha256":"fc2f1ae912d8a9f197b65f578629b19ed49c61ea2083f006b10ac260f0c4ca92"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OmVIFHbB6v7pgbPy3Zp8HTxJxilwMUEaOmH0V+18rMnRzdzRPXJwAORJN7n8d/Ai45IwC4D1CQ0Zo7J/6niLBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T01:36:15.815372Z","bundle_sha256":"c8f3166b92cbc3890a9f8ed273e1f281e73ece38472bbc9a5180f93c0318cfbc"}}