Dataset Groups Activity Stream InternLM-XComposer2-4KHD InternLM-XComposer2-4KHD is a vision-language large model that supports images with any aspect ratio from 336 pixels up to 4K HD, facilitating its deployment in real-world contexts. BibTex:

@comment{
  Dataset record for InternLM-XComposer2-4KHD, published by TIB.
  The citation key is the one generated by the exporting service and is kept
  unchanged so that existing cite commands continue to resolve.
  Author names are stored in Last, First form, the month is the bare dec macro,
  and the title is brace-protected so sentence-casing styles keep its capitals.
  No institution is recorded: the exported record carried only the placeholder
  text No Organization for it.
}
@dataset{Xiaoyi_Dong_and_Pan_Zhang_and_Yuhang_Zang_and_Yuhang_Cao_and_Bin_Wang_and_Linke_Ouyang_and_Songyang_Zhang_and_Haodong_Duan_and_Wenwei_Zhang_and_Yining_Li_and_Hang_Yan_and_Yang_Gao_and_Xinyue_Zhang_and_Wei_Li_and_Jingwen_Li_and_Kai_Chen_and_Conghui_He_and_Xingcheng_Zhang_and_Yu_Qiao_and_Dahua_Lin_and_Jiaqi_Wang_2024,
  author    = {Dong, Xiaoyi and
               Zhang, Pan and
               Zang, Yuhang and
               Cao, Yuhang and
               Wang, Bin and
               Ouyang, Linke and
               Zhang, Songyang and
               Duan, Haodong and
               Zhang, Wenwei and
               Li, Yining and
               Yan, Hang and
               Gao, Yang and
               Zhang, Xinyue and
               Li, Wei and
               Li, Jingwen and
               Chen, Kai and
               He, Conghui and
               Zhang, Xingcheng and
               Qiao, Yu and
               Lin, Dahua and
               Wang, Jiaqi},
  title     = {{InternLM-XComposer2-4KHD}},
  year      = {2024},
  month     = dec,
  publisher = {TIB},
  doi       = {10.57702/6aq51r5q},
  url       = {https://service.tib.eu/ldmservice/dataset/internlm-xcomposer2-4khd},
  keywords  = {image processing, large model, vision-language model},
  abstract  = {InternLM-XComposer2-4KHD is a vision-language large model that supports images with any aspect ratio from 336 pixels up to 4K HD, facilitating its deployment in real-world contexts.},
}