{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:AXIPP6QRGN2PCEU3AQ4WJC74VL","short_pith_number":"pith:AXIPP6QR","canonical_record":{"source":{"id":"2604.18747","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-04-20T18:52:03Z","cross_cats_sorted":[],"title_canon_sha256":"ac811ee39c2d11d37c8df1fbf1c6b85e316264bd1a6be020ad277916dcc1fa9c","abstract_canon_sha256":"7bf1fa8a0642edc119c7bd7028807ec715e2adf6517332ded1da80ea69ebdcd5"},"schema_version":"1.0"},"canonical_sha256":"05d0f7fa113374f1129b0439648bfcaae7b602b1974251a5a0f985d934deea49","source":{"kind":"arxiv","id":"2604.18747","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.18747","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"arxiv_version","alias_value":"2604.18747v2","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.18747","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"pith_short_12","alias_value":"AXIPP6QRGN2P","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"pith_short_16","alias_value":"AXIPP6QRGN2PCEU3","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"pith_short_8","alias_value":"AXIPP6QR","created_at":"2026-07-01T00:17:11Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:AXIPP6QRGN2PCEU3AQ4WJC74VL","target":"record","payload":{"canonical_record":{"source":{"id":"2604.18747","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-04-20T18:52:03Z","cross_cats_sorted":[],"title_canon_sha256":"ac811ee39c2d11d37c8df1fbf1c6b85e316264bd1a6be020ad277916dcc1fa9c","abstract_canon_sha256":"7bf1fa8a0642edc119c7bd7028807ec715e2adf6517332ded1da80ea69ebdcd5"},"schema_version":"1.0"},"canonical_sha256":"05d0f7fa113374f1129b0439648bfcaae7b602b1974251a5a0f985d934deea49","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-01T00:17:11.454869Z","signature_b64":"UWfqaZzKRz4AECRlBK3NgEdGI78l10fPpxfu2VetJQbf16B8erxFWnp0RKgmwsA055CQygzU3zhN4Wai6/MoAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"05d0f7fa113374f1129b0439648bfcaae7b602b1974251a5a0f985d934deea49","last_reissued_at":"2026-07-01T00:17:11.454292Z","signature_status":"signed_v1","first_computed_at":"2026-07-01T00:17:11.454292Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2604.18747","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T00:17:11Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oNUfKmrQSx6G72L2OLy3YqWEKdq2Z8XsYzC75gwnRIdKCq1ZyW4V1XY3YcOi4UpBHr9DGU6b2TuJsXyaQqOcBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T07:24:15.158300Z"},"content_sha256":"25759fc507e33f4e8ab42cec788287bdd890d019cf0a6b48df6361dd8e09245f","schema_version":"1.0","event_id":"sha256:25759fc507e33f4e8ab42cec788287bdd890d019cf0a6b48df6361dd8e09245f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:AXIPP6QRGN2PCEU3AQ4WJC74VL","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"URoPE: Universal Relative Position Embedding across Geometric Spaces","license":"http://creativecommons.org/licenses/by/4.0/","headline":"URoPE extends rotary position embeddings to cross-view and cross-dimensional geometry by sampling and projecting 3D ray points.","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Chensheng Peng, Depu Meng, Masayoshi Tomizuka, Quentin Herau, Wei Zhan, Yichen Xie, Yihan Hu","submitted_at":"2026-04-20T18:52:03Z","abstract_excerpt":"Relative position embedding has become a standard mechanism for encoding positional information in Transformers. However, existing formulations are typically limited to a fixed geometric space, namely 1D sequences or regular 2D/3D grids, which restricts their applicability to many computer vision tasks that require geometric reasoning across camera views or between 2D and 3D spaces. To address this limitation, we propose URoPE, a universal extension of Rotary Position Embedding (RoPE) to cross-view or cross-dimensional geometric spaces. For each key/value image patch, URoPE samples 3D points a"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"URoPE is a universal extension of Rotary Position Embedding (RoPE) to cross-view or cross-dimensional geometric spaces... URoPE is a parameter-free and intrinsics-aware relative position embedding that is invariant to the choice of global coordinate systems, while remaining fully compatible with existing RoPE-optimized attention kernels. Experiments show that URoPE consistently improves the performance of transformer-based models across all tasks.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"That sampling 3D points along camera rays at a small number of predefined depth anchors and projecting them into the query plane is sufficient to encode the necessary relative geometric relationships for effective cross-view and cross-dimensional reasoning.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"URoPE is a parameter-free relative position embedding for transformers that works across arbitrary geometric spaces by ray sampling and projection, yielding consistent gains on novel view synthesis, 3D detection, tracking, and depth estimation.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"URoPE extends rotary position embeddings to cross-view and cross-dimensional geometry by sampling and projecting 3D ray points.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"14de58701c0030b32711e619c017412fa86a2e2832c9b57b3e49998c3c25240b"},"source":{"id":"2604.18747","kind":"arxiv","version":2},"verdict":{"id":"2ed1fe89-b146-485d-84de-51e0c135eacf","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-10T04:13:18.206709Z","strongest_claim":"URoPE is a universal extension of Rotary Position Embedding (RoPE) to cross-view or cross-dimensional geometric spaces... URoPE is a parameter-free and intrinsics-aware relative position embedding that is invariant to the choice of global coordinate systems, while remaining fully compatible with existing RoPE-optimized attention kernels. Experiments show that URoPE consistently improves the performance of transformer-based models across all tasks.","one_line_summary":"URoPE is a parameter-free relative position embedding for transformers that works across arbitrary geometric spaces by ray sampling and projection, yielding consistent gains on novel view synthesis, 3D detection, tracking, and depth estimation.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"That sampling 3D points along camera rays at a small number of predefined depth anchors and projecting them into the query plane is sufficient to encode the necessary relative geometric relationships for effective cross-view and cross-dimensional reasoning.","pith_extraction_headline":"URoPE extends rotary position embeddings to cross-view and cross-dimensional geometry by sampling and projecting 3D ray points."},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2604.18747/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"doi_compliance","ran_at":"2026-05-20T03:43:52.862847Z","status":"completed","version":"1.0.0","findings_count":0}],"snapshot_sha256":"948160e13c971439a9c1810af585f7ffd3dbe414df3c05ca526fdb3e33cdb251"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"2ed1fe89-b146-485d-84de-51e0c135eacf"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T00:17:11Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5/iKXxu0q7smycVHQ1/f1Q8ppyh4FVG2F0V8//y23SYEiVvTy2+S0lvwlykcqpx3NKecAogfXnU1ddbu7x/FCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T07:24:15.158815Z"},"content_sha256":"72fdbf764e4b1be39737af302dd7c34c010486a6bdba176a70e253467c94d27d","schema_version":"1.0","event_id":"sha256:72fdbf764e4b1be39737af302dd7c34c010486a6bdba176a70e253467c94d27d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/AXIPP6QRGN2PCEU3AQ4WJC74VL/bundle.json","state_url":"https://pith.science/pith/AXIPP6QRGN2PCEU3AQ4WJC74VL/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/AXIPP6QRGN2PCEU3AQ4WJC74VL/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T07:24:15Z","links":{"resolver":"https://pith.science/pith/AXIPP6QRGN2PCEU3AQ4WJC74VL","bundle":"https://pith.science/pith/AXIPP6QRGN2PCEU3AQ4WJC74VL/bundle.json","state":"https://pith.science/pith/AXIPP6QRGN2PCEU3AQ4WJC74VL/state.json","well_known_bundle":"https://pith.science/.well-known/pith/AXIPP6QRGN2PCEU3AQ4WJC74VL/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:AXIPP6QRGN2PCEU3AQ4WJC74VL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7bf1fa8a0642edc119c7bd7028807ec715e2adf6517332ded1da80ea69ebdcd5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-04-20T18:52:03Z","title_canon_sha256":"ac811ee39c2d11d37c8df1fbf1c6b85e316264bd1a6be020ad277916dcc1fa9c"},"schema_version":"1.0","source":{"id":"2604.18747","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.18747","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"arxiv_version","alias_value":"2604.18747v2","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.18747","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"pith_short_12","alias_value":"AXIPP6QRGN2P","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"pith_short_16","alias_value":"AXIPP6QRGN2PCEU3","created_at":"2026-07-01T00:17:11Z"},{"alias_kind":"pith_short_8","alias_value":"AXIPP6QR","created_at":"2026-07-01T00:17:11Z"}],"graph_snapshots":[{"event_id":"sha256:72fdbf764e4b1be39737af302dd7c34c010486a6bdba176a70e253467c94d27d","target":"graph","created_at":"2026-07-01T00:17:11Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"URoPE is a universal extension of Rotary Position Embedding (RoPE) to cross-view or cross-dimensional geometric spaces... URoPE is a parameter-free and intrinsics-aware relative position embedding that is invariant to the choice of global coordinate systems, while remaining fully compatible with existing RoPE-optimized attention kernels. Experiments show that URoPE consistently improves the performance of transformer-based models across all tasks."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That sampling 3D points along camera rays at a small number of predefined depth anchors and projecting them into the query plane is sufficient to encode the necessary relative geometric relationships for effective cross-view and cross-dimensional reasoning."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"URoPE is a parameter-free relative position embedding for transformers that works across arbitrary geometric spaces by ray sampling and projection, yielding consistent gains on novel view synthesis, 3D detection, tracking, and depth estimation."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"URoPE extends rotary position embeddings to cross-view and cross-dimensional geometry by sampling and projecting 3D ray points."}],"snapshot_sha256":"14de58701c0030b32711e619c017412fa86a2e2832c9b57b3e49998c3c25240b"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-20T03:43:52.862847Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2604.18747/integrity.json","findings":[],"snapshot_sha256":"948160e13c971439a9c1810af585f7ffd3dbe414df3c05ca526fdb3e33cdb251","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Relative position embedding has become a standard mechanism for encoding positional information in Transformers. However, existing formulations are typically limited to a fixed geometric space, namely 1D sequences or regular 2D/3D grids, which restricts their applicability to many computer vision tasks that require geometric reasoning across camera views or between 2D and 3D spaces. To address this limitation, we propose URoPE, a universal extension of Rotary Position Embedding (RoPE) to cross-view or cross-dimensional geometric spaces. For each key/value image patch, URoPE samples 3D points a","authors_text":"Chensheng Peng, Depu Meng, Masayoshi Tomizuka, Quentin Herau, Wei Zhan, Yichen Xie, Yihan Hu","cross_cats":[],"headline":"URoPE extends rotary position embeddings to cross-view and cross-dimensional geometry by sampling and projecting 3D ray points.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-04-20T18:52:03Z","title":"URoPE: Universal Relative Position Embedding across Geometric Spaces"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2604.18747","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-10T04:13:18.206709Z","id":"2ed1fe89-b146-485d-84de-51e0c135eacf","model_set":{"reader":"grok-4.3"},"one_line_summary":"URoPE is a parameter-free relative position embedding for transformers that works across arbitrary geometric spaces by ray sampling and projection, yielding consistent gains on novel view synthesis, 3D detection, tracking, and depth estimation.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"URoPE extends rotary position embeddings to cross-view and cross-dimensional geometry by sampling and projecting 3D ray points.","strongest_claim":"URoPE is a universal extension of Rotary Position Embedding (RoPE) to cross-view or cross-dimensional geometric spaces... URoPE is a parameter-free and intrinsics-aware relative position embedding that is invariant to the choice of global coordinate systems, while remaining fully compatible with existing RoPE-optimized attention kernels. Experiments show that URoPE consistently improves the performance of transformer-based models across all tasks.","weakest_assumption":"That sampling 3D points along camera rays at a small number of predefined depth anchors and projecting them into the query plane is sufficient to encode the necessary relative geometric relationships for effective cross-view and cross-dimensional reasoning."}},"verdict_id":"2ed1fe89-b146-485d-84de-51e0c135eacf"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:25759fc507e33f4e8ab42cec788287bdd890d019cf0a6b48df6361dd8e09245f","target":"record","created_at":"2026-07-01T00:17:11Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7bf1fa8a0642edc119c7bd7028807ec715e2adf6517332ded1da80ea69ebdcd5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-04-20T18:52:03Z","title_canon_sha256":"ac811ee39c2d11d37c8df1fbf1c6b85e316264bd1a6be020ad277916dcc1fa9c"},"schema_version":"1.0","source":{"id":"2604.18747","kind":"arxiv","version":2}},"canonical_sha256":"05d0f7fa113374f1129b0439648bfcaae7b602b1974251a5a0f985d934deea49","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"05d0f7fa113374f1129b0439648bfcaae7b602b1974251a5a0f985d934deea49","first_computed_at":"2026-07-01T00:17:11.454292Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-01T00:17:11.454292Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UWfqaZzKRz4AECRlBK3NgEdGI78l10fPpxfu2VetJQbf16B8erxFWnp0RKgmwsA055CQygzU3zhN4Wai6/MoAA==","signature_status":"signed_v1","signed_at":"2026-07-01T00:17:11.454869Z","signed_message":"canonical_sha256_bytes"},"source_id":"2604.18747","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:25759fc507e33f4e8ab42cec788287bdd890d019cf0a6b48df6361dd8e09245f","sha256:72fdbf764e4b1be39737af302dd7c34c010486a6bdba176a70e253467c94d27d"],"state_sha256":"f577427945eecccbeac5dd152f6dcded63ae931d6be23fd1af79781b26c09f5c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FWZHixCasKafFMSqjaoMYeWcQwBXSpS82wikRVXB8sH7ZumxuQn9wpcNxSeAZDaq2td/5hU1E+C6Gly95j2cBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T07:24:15.161209Z","bundle_sha256":"1e02b90dfa673ff53414137d17940ba8af47b04765efdb7cd1d9025c7c9ddfa0"}}