{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:IJ7ES7ZLMAGYEMYKG5F3CWACEU","short_pith_number":"pith:IJ7ES7ZL","schema_version":"1.0","canonical_sha256":"427e497f2b600d82330a374bb158022507d4e9ec83500925c748b459d8a3caa9","source":{"kind":"arxiv","id":"2605.31116","version":1},"attestation_state":"computed","paper":{"title":"NTR: Neural Token Reconstruction for Scene Token Bottleneck in End-to-End Driving","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.RO"],"primary_cat":"cs.CV","authors_text":"Jiahui Li, Jiamin Shi, Jiawei Sun, Kaidi Yang, Liying Liu, Ming Liu, Ruiteng Zhao, Zhiyang Liu, Zixiang Ren, Zuoguan Wang","submitted_at":"2026-05-29T10:27:32Z","abstract_excerpt":"Recent perception-free end-to-end (E2E) autonomous driving methods bypass explicit perception outputs by compressing dense image patch tokens into compact scene tokens for downstream trajectory generation and scoring. While these scene tokens form a compact visual bottleneck for the planner, they receive supervision solely from the planning objective, providing limited constraints on the encoded visual information. To address this limitation, we introduce Neural Token Reconstruction (NTR), a representation learning framework to directly constrain the compact scene-token bottleneck in perceptio"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.31116","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-29T10:27:32Z","cross_cats_sorted":["cs.RO"],"title_canon_sha256":"7ce5ec861c0c7f614bc95476ce478330ff6ce9472b31e8d04c19c965463e11d2","abstract_canon_sha256":"bb0a6f5111e435d972433ddfc874b7d63335ff0739901d349b4cbd6e010b409f"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-01T01:03:58.816692Z","signature_b64":"c8uHWzmmARR3028tQtHjNAWB8wIM9vZ9vwtGaW/LvWvHR8HpuhrpLIwXOcOudVcD27m3A9Vyw9y1l51oROT2Ag==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"427e497f2b600d82330a374bb158022507d4e9ec83500925c748b459d8a3caa9","last_reissued_at":"2026-06-01T01:03:58.815825Z","signature_status":"signed_v1","first_computed_at":"2026-06-01T01:03:58.815825Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"NTR: Neural Token Reconstruction for Scene Token Bottleneck in End-to-End Driving","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.RO"],"primary_cat":"cs.CV","authors_text":"Jiahui Li, Jiamin Shi, Jiawei Sun, Kaidi Yang, Liying Liu, Ming Liu, Ruiteng Zhao, Zhiyang Liu, Zixiang Ren, Zuoguan Wang","submitted_at":"2026-05-29T10:27:32Z","abstract_excerpt":"Recent perception-free end-to-end (E2E) autonomous driving methods bypass explicit perception outputs by compressing dense image patch tokens into compact scene tokens for downstream trajectory generation and scoring. While these scene tokens form a compact visual bottleneck for the planner, they receive supervision solely from the planning objective, providing limited constraints on the encoded visual information. To address this limitation, we introduce Neural Token Reconstruction (NTR), a representation learning framework to directly constrain the compact scene-token bottleneck in perceptio"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.31116","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.31116/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.31116","created_at":"2026-06-01T01:03:58.815962+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.31116v1","created_at":"2026-06-01T01:03:58.815962+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.31116","created_at":"2026-06-01T01:03:58.815962+00:00"},{"alias_kind":"pith_short_12","alias_value":"IJ7ES7ZLMAGY","created_at":"2026-06-01T01:03:58.815962+00:00"},{"alias_kind":"pith_short_16","alias_value":"IJ7ES7ZLMAGYEMYK","created_at":"2026-06-01T01:03:58.815962+00:00"},{"alias_kind":"pith_short_8","alias_value":"IJ7ES7ZL","created_at":"2026-06-01T01:03:58.815962+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU","json":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU.json","graph_json":"https://pith.science/api/pith-number/IJ7ES7ZLMAGYEMYKG5F3CWACEU/graph.json","events_json":"https://pith.science/api/pith-number/IJ7ES7ZLMAGYEMYKG5F3CWACEU/events.json","paper":"https://pith.science/paper/IJ7ES7ZL"},"agent_actions":{"view_html":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU","download_json":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU.json","view_paper":"https://pith.science/paper/IJ7ES7ZL","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.31116&json=true","fetch_graph":"https://pith.science/api/pith-number/IJ7ES7ZLMAGYEMYKG5F3CWACEU/graph.json","fetch_events":"https://pith.science/api/pith-number/IJ7ES7ZLMAGYEMYKG5F3CWACEU/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU/action/timestamp_anchor","attest_storage":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU/action/storage_attestation","attest_author":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU/action/author_attestation","sign_citation":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU/action/citation_signature","submit_replication":"https://pith.science/pith/IJ7ES7ZLMAGYEMYKG5F3CWACEU/action/replication_record"}},"created_at":"2026-06-01T01:03:58.815962+00:00","updated_at":"2026-06-01T01:03:58.815962+00:00"}