{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:HT7SH2RNXD3HMK45YXIYN3YTTQ","short_pith_number":"pith:HT7SH2RN","schema_version":"1.0","canonical_sha256":"3cff23ea2db8f6762b9dc5d186ef139c1031f42d31058a188d84c874a3d4109d","source":{"kind":"arxiv","id":"2605.14615","version":1},"attestation_state":"computed","paper":{"title":"CalibAnyView: Beyond Single-View Camera Calibration in the Wild","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"CalibAnyView enables camera calibration from any number of views in the wild by enforcing cross-view geometric consistency.","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Boying Li, Cheng Zhang, Daniel Cremers, Hamid Rezatofighi, Ian Reid, Weirong Chen","submitted_at":"2026-05-14T09:32:12Z","abstract_excerpt":"Camera calibration is a fundamental prerequisite for reliable geometric perception, yet classical approaches rely on controlled acquisition setups that are impractical for in-the-wild imagery. Recent learning-based methods have shown promising results for single-view calibration, but inherently neglect geometric consistency across multiple views. We introduce CalibAnyView, a unified formulation that supports an arbitrary number of input views ($N \\geq 1$) by explicitly modeling cross-view geometric consistency. To facilitate this, we construct a large-scale multi-view video dataset covering di"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":true,"formal_links_present":true},"canonical_record":{"source":{"id":"2605.14615","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T09:32:12Z","cross_cats_sorted":[],"title_canon_sha256":"15dee3fb9070d209ad4a19d24f8d968e971e2fab4c54ae7625d75b95070dd4d5","abstract_canon_sha256":"216f8d417ba85d00725a6b162724a89e0c183be8f294d7ad29f3d33f765a46ef"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:39:04.122715Z","signature_b64":"YU80+CqN7POHrt0g5jqMG+iGcTBa6pHFaVeSQCx2SFy+XYXj1Z/AOg+y09gNJN/qUQIr5HNvRdpmciNn15TfCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3cff23ea2db8f6762b9dc5d186ef139c1031f42d31058a188d84c874a3d4109d","last_reissued_at":"2026-05-17T23:39:04.121970Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:39:04.121970Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"CalibAnyView: Beyond Single-View Camera Calibration in the Wild","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"CalibAnyView enables camera calibration from any number of views in the wild by enforcing cross-view geometric consistency.","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Boying Li, Cheng Zhang, Daniel Cremers, Hamid Rezatofighi, Ian Reid, Weirong Chen","submitted_at":"2026-05-14T09:32:12Z","abstract_excerpt":"Camera calibration is a fundamental prerequisite for reliable geometric perception, yet classical approaches rely on controlled acquisition setups that are impractical for in-the-wild imagery. Recent learning-based methods have shown promising results for single-view calibration, but inherently neglect geometric consistency across multiple views. We introduce CalibAnyView, a unified formulation that supports an arbitrary number of input views ($N \\geq 1$) by explicitly modeling cross-view geometric consistency. To facilitate this, we construct a large-scale multi-view video dataset covering di"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"CalibAnyView consistently outperforms state-of-the-art methods, achieves strong robustness under single-view settings, and further improves with multi-view inference.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"The constructed large-scale multi-view video dataset sufficiently covers the diversity of real-world camera models, dynamic scenes, motion trajectories, and lens distortions so that the learned model generalizes beyond the training distribution.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"A multi-view transformer predicts dense perspective fields that feed a geometric optimizer to estimate camera intrinsics and gravity from arbitrary numbers of real-world views.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"CalibAnyView enables camera calibration from any number of views in the wild by enforcing cross-view geometric consistency.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"c1953e2c62b12106d16d10a88780c5208acdca1c2b998be04e02baa03ad21a48"},"source":{"id":"2605.14615","kind":"arxiv","version":1},"verdict":{"id":"1f5bf76f-6aa7-46d1-96f5-0f13ca415c11","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-15T05:56:58.310994Z","strongest_claim":"CalibAnyView consistently outperforms state-of-the-art methods, achieves strong robustness under single-view settings, and further improves with multi-view inference.","one_line_summary":"A multi-view transformer predicts dense perspective fields that feed a geometric optimizer to estimate camera intrinsics and gravity from arbitrary numbers of real-world views.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"The constructed large-scale multi-view video dataset sufficiently covers the diversity of real-world camera models, dynamic scenes, motion trajectories, and lens distortions so that the learned model generalizes beyond the training distribution.","pith_extraction_headline":"CalibAnyView enables camera calibration from any number of views in the wild by enforcing cross-view geometric consistency."},"references":{"count":61,"sample":[{"doi":"","year":2011,"title":"Communications of the ACM54(10), 105–112 (2011)","work_id":"e98ad0ee-c84a-4110-a036-4198d635688d","ref_index":1,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":2017,"title":"Joint 2d-3d-semantic data for indoor scene understanding","work_id":"cd49417b-13e3-4652-87f2-c992e78d093a","ref_index":2,"cited_arxiv_id":"1702.01105","is_internal_anchor":true},{"doi":"","year":2025,"title":"Qwen2.5-VL Technical Report","work_id":"69dffacb-bfe8-442d-be86-48624c60426f","ref_index":3,"cited_arxiv_id":"2502.13923","is_internal_anchor":true},{"doi":"","year":2011,"title":"In: CVPR 2011","work_id":"ececda63-0d1a-4aa7-8188-c69cee730905","ref_index":4,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":2018,"title":"Bogdan, O., Eckstein, V., Rameau, F., Bazin, J.C.: Deepcalib: A deep learning ap- proach for automatic intrinsic calibration of wide field-of-view cameras. In: CVMP. pp. 1–10 (2018)","work_id":"31c5c3a5-a4b7-4f79-a177-d23da30048ce","ref_index":5,"cited_arxiv_id":"","is_internal_anchor":false}],"resolved_work":61,"snapshot_sha256":"d6da3f5bdb80452c222ee150623c4a3b2d4c16f901f0b0e0a405ded8da8ced13","internal_anchors":5},"formal_canon":{"evidence_count":2,"snapshot_sha256":"3922add496d94c357b78d0eb30a471ac4439a70c70f15f0f9cd19fa30e8e809b"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.14615","created_at":"2026-05-17T23:39:04.122095+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.14615v1","created_at":"2026-05-17T23:39:04.122095+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14615","created_at":"2026-05-17T23:39:04.122095+00:00"},{"alias_kind":"pith_short_12","alias_value":"HT7SH2RNXD3H","created_at":"2026-05-18T12:33:37.589309+00:00"},{"alias_kind":"pith_short_16","alias_value":"HT7SH2RNXD3HMK45","created_at":"2026-05-18T12:33:37.589309+00:00"},{"alias_kind":"pith_short_8","alias_value":"HT7SH2RN","created_at":"2026-05-18T12:33:37.589309+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":2,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ","json":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ.json","graph_json":"https://pith.science/api/pith-number/HT7SH2RNXD3HMK45YXIYN3YTTQ/graph.json","events_json":"https://pith.science/api/pith-number/HT7SH2RNXD3HMK45YXIYN3YTTQ/events.json","paper":"https://pith.science/paper/HT7SH2RN"},"agent_actions":{"view_html":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ","download_json":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ.json","view_paper":"https://pith.science/paper/HT7SH2RN","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.14615&json=true","fetch_graph":"https://pith.science/api/pith-number/HT7SH2RNXD3HMK45YXIYN3YTTQ/graph.json","fetch_events":"https://pith.science/api/pith-number/HT7SH2RNXD3HMK45YXIYN3YTTQ/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ/action/timestamp_anchor","attest_storage":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ/action/storage_attestation","attest_author":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ/action/author_attestation","sign_citation":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ/action/citation_signature","submit_replication":"https://pith.science/pith/HT7SH2RNXD3HMK45YXIYN3YTTQ/action/replication_record"}},"created_at":"2026-05-17T23:39:04.122095+00:00","updated_at":"2026-05-17T23:39:04.122095+00:00"}