% VisionLLM arXiv preprint (2305.11175): identifier kept in eprint/archiveprefix rather than a fake journal name.
@misc{wang2023visionllm,
  author        = {Wang, Wenhai and Chen, Zhe and Chen, Xiaokang and Wu, Jiannan and Zhu, Xizhou and Zeng, Gang and Luo, Ping and Lu, Tong and Zhou, Jie and Qiao, Yu and others},
  title         = {{VisionLLM}: Large Language Model is also an Open-Ended Decoder for Vision-Centric Tasks},
  year          = {2023},
  eprint        = {2305.11175},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2305.11175},
}