Dataset Groups Activity Stream
VisionLLaMA: A Unified LLaMA Interface for Vision Tasks
VisionLLaMA is a unified and generic modeling framework for solving most vision tasks.
BibTex:

@comment{
  Dataset record for VisionLLaMA as exported from the TIB data service page.
  The citation key is kept exactly as exported so existing \cite commands
  continue to resolve.
  NOTE(review): institution = {No Organization} looks like an export
  placeholder rather than a real affiliation -- confirm before citing.
}

@dataset{Xiangxiang_Chu_and_Jianlin_Su_and_Bo_Zhang_and_Chunhua_Shen_2024,
  author      = {Chu, Xiangxiang and Su, Jianlin and Zhang, Bo and Shen, Chunhua},
  title       = {{VisionLLaMA}: A Unified {LLaMA} Interface for Vision Tasks},
  abstract    = {VisionLLaMA is a unified and generic modeling framework for solving most vision tasks.},
  keywords    = {image classification, image generation, vision transformer},
  institution = {No Organization},
  publisher   = {TIB},
  month       = dec,
  year        = {2024},
  doi         = {10.57702/cjy8r7i0},
  url         = {https://service.tib.eu/ldmservice/dataset/visionllama--a-unified-llama-interface-for-vision-tasks},
}