{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:36EBL2IGTSN3MFVMSWGHBXKQ3I","short_pith_number":"pith:36EBL2IG","canonical_record":{"source":{"id":"2605.21258","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-20T14:48:01Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"67e951b9fa47c67fee3a5c79217205d2dfe1cffc8a44d132b3ce738b75ba84e5","abstract_canon_sha256":"fb0fe2d2fa56d12723752d69fa26fb7c36290e0f0866d65306ff722cb1ea886e"},"schema_version":"1.0"},"canonical_sha256":"df8815e9069c9bb616ac958c70dd50da372ae80af7326b339a671a56b0ae8846","source":{"kind":"arxiv","id":"2605.21258","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.21258","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"arxiv_version","alias_value":"2605.21258v1","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.21258","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"pith_short_12","alias_value":"36EBL2IGTSN3","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"pith_short_16","alias_value":"36EBL2IGTSN3MFVM","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"pith_short_8","alias_value":"36EBL2IG","created_at":"2026-05-21T02:05:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:36EBL2IGTSN3MFVMSWGHBXKQ3I","target":"record","payload":{"canonical_record":{"source":{"id":"2605.21258","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-20T14:48:01Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"67e951b9fa47c67fee3a5c79217205d2dfe1cffc8a44d132b3ce738b75ba84e5","abstract_canon_sha256":"fb0fe2d2fa56d12723752d69fa26fb7c36290e0f0866d65306ff722cb1ea886e"},"schema_version":"1.0"},"canonical_sha256":"df8815e9069c9bb616ac958c70dd50da372ae80af7326b339a671a56b0ae8846","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-21T02:05:25.353886Z","signature_b64":"XFnynLykAj6ymAPdanK3KTC1OyffH/Pnd5irpXVdcO5/19pGkouzye0Tumql3vBh9xkOLQfl9k6mvyVYI1qsAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"df8815e9069c9bb616ac958c70dd50da372ae80af7326b339a671a56b0ae8846","last_reissued_at":"2026-05-21T02:05:25.353043Z","signature_status":"signed_v1","first_computed_at":"2026-05-21T02:05:25.353043Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.21258","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T02:05:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Swx1zkARv32pBJb1sxw77uQz86DGqmW7sYTdt0TrrWx0f1gyJowK21eegKpUQxMoUatM3xQXNABFrfG0iFT8Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T19:24:45.723748Z"},"content_sha256":"a6492100bb8082df3e8fa6fe6cfd7b0272765f3fb1d0aae0d6e9b300d63e7d5a","schema_version":"1.0","event_id":"sha256:a6492100bb8082df3e8fa6fe6cfd7b0272765f3fb1d0aae0d6e9b300d63e7d5a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:36EBL2IGTSN3MFVMSWGHBXKQ3I","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Learning Structural Latent Points for Efficient Visual Representations in Robotic Manipulation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.RO","authors_text":"Jiahang Cao, Jiaxu Wang, Jingkai Sun, Junhao He, Junhao Li, Mingyuan Sun, Qiang Zhang, Qiming Shao, Xiangyu Yue, YiCheng Jiang, Zesen Gan","submitted_at":"2026-05-20T14:48:01Z","abstract_excerpt":"Current 3D-aware pretraining methods for embodied perception and manipulation are largely built on differentiable rendering frameworks, producing either fully implicit neural fields or fully explicit geometric primitives. Implicit representations, while expressive, lack explicit structural cues, whereas explicit ones preserve geometry but suffer from resolution limits and weak generalization. To address these limitations, we propose a novel pretraining framework that learns a hybrid representation-structural latent points. Specifically, we insert a point-wise latent variational autoencoder int"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.21258","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.21258/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T02:05:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1xskHhSr/6WX5goql8hczJKMp/6+Hg/FvPL/n0juHNqqGaLKKS5+/5OQxSR3ktC9jAxVGX0Jf6CoSJKmQNzMBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T19:24:45.724519Z"},"content_sha256":"1725e09d407e7a6395026782fa24351c59a269c84191776bf27ba4221c5da79d","schema_version":"1.0","event_id":"sha256:1725e09d407e7a6395026782fa24351c59a269c84191776bf27ba4221c5da79d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/36EBL2IGTSN3MFVMSWGHBXKQ3I/bundle.json","state_url":"https://pith.science/pith/36EBL2IGTSN3MFVMSWGHBXKQ3I/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/36EBL2IGTSN3MFVMSWGHBXKQ3I/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T19:24:45Z","links":{"resolver":"https://pith.science/pith/36EBL2IGTSN3MFVMSWGHBXKQ3I","bundle":"https://pith.science/pith/36EBL2IGTSN3MFVMSWGHBXKQ3I/bundle.json","state":"https://pith.science/pith/36EBL2IGTSN3MFVMSWGHBXKQ3I/state.json","well_known_bundle":"https://pith.science/.well-known/pith/36EBL2IGTSN3MFVMSWGHBXKQ3I/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:36EBL2IGTSN3MFVMSWGHBXKQ3I","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fb0fe2d2fa56d12723752d69fa26fb7c36290e0f0866d65306ff722cb1ea886e","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-20T14:48:01Z","title_canon_sha256":"67e951b9fa47c67fee3a5c79217205d2dfe1cffc8a44d132b3ce738b75ba84e5"},"schema_version":"1.0","source":{"id":"2605.21258","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.21258","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"arxiv_version","alias_value":"2605.21258v1","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.21258","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"pith_short_12","alias_value":"36EBL2IGTSN3","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"pith_short_16","alias_value":"36EBL2IGTSN3MFVM","created_at":"2026-05-21T02:05:25Z"},{"alias_kind":"pith_short_8","alias_value":"36EBL2IG","created_at":"2026-05-21T02:05:25Z"}],"graph_snapshots":[{"event_id":"sha256:1725e09d407e7a6395026782fa24351c59a269c84191776bf27ba4221c5da79d","target":"graph","created_at":"2026-05-21T02:05:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.21258/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Current 3D-aware pretraining methods for embodied perception and manipulation are largely built on differentiable rendering frameworks, producing either fully implicit neural fields or fully explicit geometric primitives. Implicit representations, while expressive, lack explicit structural cues, whereas explicit ones preserve geometry but suffer from resolution limits and weak generalization. To address these limitations, we propose a novel pretraining framework that learns a hybrid representation-structural latent points. Specifically, we insert a point-wise latent variational autoencoder int","authors_text":"Jiahang Cao, Jiaxu Wang, Jingkai Sun, Junhao He, Junhao Li, Mingyuan Sun, Qiang Zhang, Qiming Shao, Xiangyu Yue, YiCheng Jiang, Zesen Gan","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-20T14:48:01Z","title":"Learning Structural Latent Points for Efficient Visual Representations in Robotic Manipulation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.21258","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a6492100bb8082df3e8fa6fe6cfd7b0272765f3fb1d0aae0d6e9b300d63e7d5a","target":"record","created_at":"2026-05-21T02:05:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fb0fe2d2fa56d12723752d69fa26fb7c36290e0f0866d65306ff722cb1ea886e","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-05-20T14:48:01Z","title_canon_sha256":"67e951b9fa47c67fee3a5c79217205d2dfe1cffc8a44d132b3ce738b75ba84e5"},"schema_version":"1.0","source":{"id":"2605.21258","kind":"arxiv","version":1}},"canonical_sha256":"df8815e9069c9bb616ac958c70dd50da372ae80af7326b339a671a56b0ae8846","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"df8815e9069c9bb616ac958c70dd50da372ae80af7326b339a671a56b0ae8846","first_computed_at":"2026-05-21T02:05:25.353043Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-21T02:05:25.353043Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"XFnynLykAj6ymAPdanK3KTC1OyffH/Pnd5irpXVdcO5/19pGkouzye0Tumql3vBh9xkOLQfl9k6mvyVYI1qsAA==","signature_status":"signed_v1","signed_at":"2026-05-21T02:05:25.353886Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.21258","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a6492100bb8082df3e8fa6fe6cfd7b0272765f3fb1d0aae0d6e9b300d63e7d5a","sha256:1725e09d407e7a6395026782fa24351c59a269c84191776bf27ba4221c5da79d"],"state_sha256":"3425596f77b8397ce017c9ad598c5dc3fccfbc5c08bb538fdb3b6f15217daa8d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OAWAq6pnTVWCW7UnKzZgudTRS4ZDhohJoHiQVehejDM3ODOE7Fk5xuJb+2dK/8x0rBUTXLv3MOBdRWMv6nqNBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T19:24:45.728759Z","bundle_sha256":"fc630131df3256f5c05bcd8d75afc84239de42b91676c2a57aa2898aab414e4a"}}