{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:VGLOYHWFMPJ2DP6A75VL3BMZD7","short_pith_number":"pith:VGLOYHWF","canonical_record":{"source":{"id":"2606.00095","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T08:53:21Z","cross_cats_sorted":["cs.AI","cs.CL","cs.RO"],"title_canon_sha256":"45128861a283add2ecb0b5c92313ef90ce2897837bd5dc7c56663a66c390da7c","abstract_canon_sha256":"6740a7b136b8f9d6bcac9ea637a8e740e3c89b53f738fe2abfffdcc31ffb747b"},"schema_version":"1.0"},"canonical_sha256":"a996ec1ec563d3a1bfc0ff6abd85991fd4ec63f8c5a055509822a2c9385f0270","source":{"kind":"arxiv","id":"2606.00095","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00095","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00095v1","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00095","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_12","alias_value":"VGLOYHWFMPJ2","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_16","alias_value":"VGLOYHWFMPJ2DP6A","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_8","alias_value":"VGLOYHWF","created_at":"2026-06-02T00:03:14Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:VGLOYHWFMPJ2DP6A75VL3BMZD7","target":"record","payload":{"canonical_record":{"source":{"id":"2606.00095","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T08:53:21Z","cross_cats_sorted":["cs.AI","cs.CL","cs.RO"],"title_canon_sha256":"45128861a283add2ecb0b5c92313ef90ce2897837bd5dc7c56663a66c390da7c","abstract_canon_sha256":"6740a7b136b8f9d6bcac9ea637a8e740e3c89b53f738fe2abfffdcc31ffb747b"},"schema_version":"1.0"},"canonical_sha256":"a996ec1ec563d3a1bfc0ff6abd85991fd4ec63f8c5a055509822a2c9385f0270","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T00:03:14.853084Z","signature_b64":"gMZ+t3a7T9ip6SS7GsyytKDnIhPxoZKHK7T+vmWKMRCT5cgG9IhfdPLWh7QFmArQmHrHCsqGFbGAk/aTSTh8CA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a996ec1ec563d3a1bfc0ff6abd85991fd4ec63f8c5a055509822a2c9385f0270","last_reissued_at":"2026-06-02T00:03:14.852603Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T00:03:14.852603Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.00095","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T00:03:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/rQb3aSzOeuH4qZRFg0KtrpE3/ERwMPDJHzAGa/2e1SGwPCTKkkJ4vEJb8jA6iV9OweqLV9ltaHg+wVJW18ODw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T21:26:47.463088Z"},"content_sha256":"5a70a6da480845b1bd1832a774ec713aeea74911a0d8547a93e5db603697159b","schema_version":"1.0","event_id":"sha256:5a70a6da480845b1bd1832a774ec713aeea74911a0d8547a93e5db603697159b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:VGLOYHWFMPJ2DP6A75VL3BMZD7","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Bridging the 2D-3D Gap: A Hierarchical Semantic-Geometric Map for Vision Language Navigation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.RO"],"primary_cat":"cs.CV","authors_text":"Jingyu Gong, Kailing Li, Liang He, Lijin Yang, Tianwen Qian, Xiaoling Wang, Yuqian Fu","submitted_at":"2026-05-25T08:53:21Z","abstract_excerpt":"Vision-Language Navigation (VLN) enables embodied agents to reach target locations in unseen environments by following language instructions. Despite recent progress with vision-language models (VLMs), a critical semantic-geometric gap remains: while VLMs excel at language and 2D visual understanding, they struggle with 3D spatial reasoning and fail to capture the causal dynamics between actions and spatial transitions, resulting in unreliable navigation, particularly in zero-shot settings. To bridge this gap, we propose a Hierarchical Semantic-Geometric Map (HSGM) that transforms 3D geometric"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00095","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.00095/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T00:03:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"gIODybXxKRvAxYeglvBqvLM2AgzediCZDM/HhEg7ryv2vevLa0EF8bWdg2GAJgg6YeZpWLFLH/vclc7tSedWAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T21:26:47.463752Z"},"content_sha256":"a9bcae3ab443683e04814aadb416b29dfbd54426b91fcd2abc093081fc5f466b","schema_version":"1.0","event_id":"sha256:a9bcae3ab443683e04814aadb416b29dfbd54426b91fcd2abc093081fc5f466b"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/VGLOYHWFMPJ2DP6A75VL3BMZD7/bundle.json","state_url":"https://pith.science/pith/VGLOYHWFMPJ2DP6A75VL3BMZD7/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/VGLOYHWFMPJ2DP6A75VL3BMZD7/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T21:26:47Z","links":{"resolver":"https://pith.science/pith/VGLOYHWFMPJ2DP6A75VL3BMZD7","bundle":"https://pith.science/pith/VGLOYHWFMPJ2DP6A75VL3BMZD7/bundle.json","state":"https://pith.science/pith/VGLOYHWFMPJ2DP6A75VL3BMZD7/state.json","well_known_bundle":"https://pith.science/.well-known/pith/VGLOYHWFMPJ2DP6A75VL3BMZD7/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:VGLOYHWFMPJ2DP6A75VL3BMZD7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6740a7b136b8f9d6bcac9ea637a8e740e3c89b53f738fe2abfffdcc31ffb747b","cross_cats_sorted":["cs.AI","cs.CL","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T08:53:21Z","title_canon_sha256":"45128861a283add2ecb0b5c92313ef90ce2897837bd5dc7c56663a66c390da7c"},"schema_version":"1.0","source":{"id":"2606.00095","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00095","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00095v1","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00095","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_12","alias_value":"VGLOYHWFMPJ2","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_16","alias_value":"VGLOYHWFMPJ2DP6A","created_at":"2026-06-02T00:03:14Z"},{"alias_kind":"pith_short_8","alias_value":"VGLOYHWF","created_at":"2026-06-02T00:03:14Z"}],"graph_snapshots":[{"event_id":"sha256:a9bcae3ab443683e04814aadb416b29dfbd54426b91fcd2abc093081fc5f466b","target":"graph","created_at":"2026-06-02T00:03:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.00095/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Vision-Language Navigation (VLN) enables embodied agents to reach target locations in unseen environments by following language instructions. Despite recent progress with vision-language models (VLMs), a critical semantic-geometric gap remains: while VLMs excel at language and 2D visual understanding, they struggle with 3D spatial reasoning and fail to capture the causal dynamics between actions and spatial transitions, resulting in unreliable navigation, particularly in zero-shot settings. To bridge this gap, we propose a Hierarchical Semantic-Geometric Map (HSGM) that transforms 3D geometric","authors_text":"Jingyu Gong, Kailing Li, Liang He, Lijin Yang, Tianwen Qian, Xiaoling Wang, Yuqian Fu","cross_cats":["cs.AI","cs.CL","cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T08:53:21Z","title":"Bridging the 2D-3D Gap: A Hierarchical Semantic-Geometric Map for Vision Language Navigation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00095","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5a70a6da480845b1bd1832a774ec713aeea74911a0d8547a93e5db603697159b","target":"record","created_at":"2026-06-02T00:03:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6740a7b136b8f9d6bcac9ea637a8e740e3c89b53f738fe2abfffdcc31ffb747b","cross_cats_sorted":["cs.AI","cs.CL","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-25T08:53:21Z","title_canon_sha256":"45128861a283add2ecb0b5c92313ef90ce2897837bd5dc7c56663a66c390da7c"},"schema_version":"1.0","source":{"id":"2606.00095","kind":"arxiv","version":1}},"canonical_sha256":"a996ec1ec563d3a1bfc0ff6abd85991fd4ec63f8c5a055509822a2c9385f0270","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a996ec1ec563d3a1bfc0ff6abd85991fd4ec63f8c5a055509822a2c9385f0270","first_computed_at":"2026-06-02T00:03:14.852603Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T00:03:14.852603Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"gMZ+t3a7T9ip6SS7GsyytKDnIhPxoZKHK7T+vmWKMRCT5cgG9IhfdPLWh7QFmArQmHrHCsqGFbGAk/aTSTh8CA==","signature_status":"signed_v1","signed_at":"2026-06-02T00:03:14.853084Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.00095","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5a70a6da480845b1bd1832a774ec713aeea74911a0d8547a93e5db603697159b","sha256:a9bcae3ab443683e04814aadb416b29dfbd54426b91fcd2abc093081fc5f466b"],"state_sha256":"e256df42a1537ec7dbdd899954d7bffccdb8965bc24f58f407ae4d4ccdf0acde"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FSLpvcS6J7UPQ2yOzRMCCdE+6PFiNcc6sh84C9UkmJ599k/O415V6kzy2zyziAI7xbxqu6hP0uETILGzvNr8CA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T21:26:47.466966Z","bundle_sha256":"ad0c4877b2583ed4aa2bd3cfcc05c6c18ed482bf64746c6aec46189379075b1a"}}