{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2023:5D2WXBJ2TG7KRTXDLL4DFQEDT7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"59e3f95092acd3d3e1600453722793990336b1ac3f0ae6d26062b22dd654cfa5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2023-11-07T00:12:01Z","title_canon_sha256":"684c7f1de2521ff5a071ec4ec538eca4d9909b03cf4dde61c111b57029cf7325"},"schema_version":"1.0","source":{"id":"2311.03620","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2311.03620","created_at":"2026-07-05T07:10:01Z"},{"alias_kind":"arxiv_version","alias_value":"2311.03620v1","created_at":"2026-07-05T07:10:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2311.03620","created_at":"2026-07-05T07:10:01Z"},{"alias_kind":"pith_short_12","alias_value":"5D2WXBJ2TG7K","created_at":"2026-07-05T07:10:01Z"},{"alias_kind":"pith_short_16","alias_value":"5D2WXBJ2TG7KRTXD","created_at":"2026-07-05T07:10:01Z"},{"alias_kind":"pith_short_8","alias_value":"5D2WXBJ2","created_at":"2026-07-05T07:10:01Z"}],"graph_snapshots":[{"event_id":"sha256:c282cd2e880fef1fc9fbb1495303f78d228051abf6e6088168261ffcc7703e66","target":"graph","created_at":"2026-07-05T07:10:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2311.03620/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"For 3D object detection, both camera and lidar have been demonstrated to be useful sensory devices for providing complementary information about the same scenery with data representations in different modalities, e.g., 2D RGB image vs 3D point cloud. An effective representation learning and fusion of such multi-modal sensor data is necessary and critical for better 3D object detection performance. To solve the problem, in this paper, we will introduce a novel vision transformer-based 3D object detection model, namely FusionViT. Different from the existing 3D object detection approaches, Fusion","authors_text":"Jiawei Zhang, Xinhao Xiang","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2023-11-07T00:12:01Z","title":"FusionViT: Hierarchical 3D Object Detection via LiDAR-Camera Vision Transformer Fusion"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2311.03620","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e18876a379bf58d87169236caefc016d048515214ba25b61b9851026c0543740","target":"record","created_at":"2026-07-05T07:10:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"59e3f95092acd3d3e1600453722793990336b1ac3f0ae6d26062b22dd654cfa5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2023-11-07T00:12:01Z","title_canon_sha256":"684c7f1de2521ff5a071ec4ec538eca4d9909b03cf4dde61c111b57029cf7325"},"schema_version":"1.0","source":{"id":"2311.03620","kind":"arxiv","version":1}},"canonical_sha256":"e8f56b853a99bea8cee35af832c0839fd2883cabbe3cebcd30f5eccba49370cf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e8f56b853a99bea8cee35af832c0839fd2883cabbe3cebcd30f5eccba49370cf","first_computed_at":"2026-07-05T07:10:01.227437Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T07:10:01.227437Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"J9c8FKL7seMDMcGHz00aWW0gf3IEKkRzIRWlHY6wzJ+jipYHi4L4qKy8PTgfkTUp0zI8E0q4gWCxCXSnK7CEBQ==","signature_status":"signed_v1","signed_at":"2026-07-05T07:10:01.227988Z","signed_message":"canonical_sha256_bytes"},"source_id":"2311.03620","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e18876a379bf58d87169236caefc016d048515214ba25b61b9851026c0543740","sha256:c282cd2e880fef1fc9fbb1495303f78d228051abf6e6088168261ffcc7703e66"],"state_sha256":"22dd5634f835c4bbee0d727dc4bf0d10fcb0c4c4311d2362d33ce8940bdbf1ba"}