{"work":{"id":"799b1f12-2edc-4b09-a83b-dbd87e1404e7","openalex_id":null,"doi":null,"arxiv_id":"2404.06512","raw_key":null,"title":"Internlm-xcomposer2-4khd: A pioneering large vision-language model handling resolutions from 336 pixels to 4k hd","authors":null,"authors_text":"Xiaoyi Dong, Pan Zhang, Yuhang Zang, Yuhang Cao, Bin Wang, Linke Ouyang, Songyang Zhang, Haodong Duan, Wenwei Zhang, Yining Li, Hang Yan, Yang Gao, Zhe Chen, Xinyue Zhang, Wei Li, Jingwen Li, Wenhai Wang, Kai Chen, Conghui He, Xingcheng Zha","year":2024,"venue":null,"abstract":null,"external_url":"https://arxiv.org/abs/2404.06512","cited_by_count":null,"metadata_source":"arxiv_reference","metadata_fetched_at":"2026-05-23T19:43:23.809338+00:00","pith_arxiv_id":null,"created_at":"2026-05-10T13:23:57.961378+00:00","updated_at":"2026-06-05T21:23:00.469572+00:00","title_quality_ok":true,"display_title":"Internlm-xcomposer2-4khd: A pioneering large vision-language model handling resolutions from 336 pixels to 4k hd","render_title":"Internlm-xcomposer2-4khd: A pioneering large vision-language model handling resolutions from 336 pixels to 4k hd"},"hub":{"state":{"work_id":"799b1f12-2edc-4b09-a83b-dbd87e1404e7","tier":"hub","tier_reason":"10+ Pith inbound or 1,000+ external citations","pith_inbound_count":11,"external_cited_by_count":null,"distinct_field_count":2,"first_pith_cited_at":"2024-04-22T14:32:33+00:00","last_pith_cited_at":"2025-04-14T17:59:25+00:00","author_build_status":"not_needed","summary_status":"needed","contexts_status":"needed","graph_status":"needed","ask_index_status":"not_needed","reader_status":"not_needed","recognition_status":"not_needed","updated_at":"2026-06-10T16:26:54.875028+00:00","tier_text":"hub"},"tier":"hub","role_counts":[{"context_role":"background","n":8}],"polarity_counts":[{"context_polarity":"background","n":7},{"context_polarity":"unclear","n":1}],"runs":{},"summary":{},"graph":{},"authors":[]}}