Dataset Groups Activity Stream Kosmos-2: Grounding multimodal large language models to the world Kosmos-2: Grounding multimodal large language models to the world. BibTex:

% Dataset record for "Kosmos-2" (publisher: TIB). Text outside the entry is
% ignored by BibTeX. The citation key is kept as exported so existing
% citations of this entry keep resolving.
@dataset{Zhiliang_Peng_and_Wenhui_Wang_and_Li_Dong_and_Yaru_Hao_and_Shaohan_Huang_and_Shuming_Ma_and_Furu_Wei_2024,
  author      = {Peng, Zhiliang and Wang, Wenhui and Dong, Li and Hao, Yaru and Huang, Shaohan and Ma, Shuming and Wei, Furu},
  title       = {{Kosmos-2}: Grounding multimodal large language models to the world},
  abstract    = {Kosmos-2: Grounding multimodal large language models to the world.},
  keywords    = {Grounding, Large language models, Multimodal learning},
  institution = {No Organization},
  publisher   = {TIB},
  year        = {2024},
  month       = dec,
  doi         = {10.57702/elgkymz1},
  url         = {https://service.tib.eu/ldmservice/dataset/kosmos-2--grounding-multimodal-large-language-models-to-the-world},
}