Dataset Groups Activity Stream Vision-and-Language Navigation The Vision-and-Language Navigation (VLN) task gives a global natural sentence I = {w0,..., wl} as an instruction, where wi is a word token while the l is the length of the sentence. BibTex:

@comment{
  Citation record for the "Vision-and-Language Navigation" dataset page
  hosted by TIB (see the doi and url fields of the entry below).

  NOTE(review): the author token "Jitendra Ma-Vladlen Koltun" looks like
  two separate names that were fused or truncated upstream. Verify the
  full author list against the DOI landing page before citing. The
  citation key embeds the same token and is intentionally left unchanged
  so that existing citations keep resolving.

  NOTE(review): institution "No Organization" looks like an exporter
  placeholder rather than a real affiliation. Confirm, then correct or
  drop it.
}

@dataset{Peter_Anderson_and_Angel_X_Chang_and_Devendra_Singh_Chaplot_and_Alexey_Dosovitsky_and_Saurabh_Gupta_and_Jitendra_Ma-Vladlen_Koltun_and_Manolis_Savva_and_Amir_Roshan_Zamir_2024,
  author      = {Peter Anderson and Angel X. Chang and Devendra Singh Chaplot and Alexey Dosovitsky and Saurabh Gupta and Jitendra Ma-Vladlen Koltun and Manolis Savva and Amir Roshan Zamir},
  title       = {Vision-and-Language Navigation},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/ntvoct4a},
  url         = {https://service.tib.eu/ldmservice/dataset/vision-and-language-navigation},
  keywords    = {Instruction Following, Navigation, Vision-and-Language Navigation, language instructions, natural language instruction, panoramic view, vision-and-language navigation, vision-language navigation},
  abstract    = {The Vision-and-Language Navigation (VLN) task gives a global natural sentence I = {w0,..., wl} as an instruction, where wi is a word token while the l is the length of the sentence.},
}