% arXiv preprint 2312.06109 (dblp CoRR record, exported via BibSonomy).
% The doi/eprint fields carry the identifiers in machine-readable form;
% added-at, biburl, ee, interhash, intrahash, keywords and timestamp are
% export metadata that standard styles ignore.
@article{journals/corr/abs-2312-06109,
  author        = {Wei, Haoran and Kong, Lingyu and Chen, Jinyue and Zhao, Liang and Ge, Zheng and Yang, Jinrong and Sun, Jianjian and Han, Chunrui and Zhang, Xiangyu},
  title         = {{Vary}: Scaling up the Vision Vocabulary for Large Vision-Language Models},
  journal       = {CoRR},
  volume        = {abs/2312.06109},
  year          = {2023},
  doi           = {10.48550/arXiv.2312.06109},
  eprint        = {2312.06109},
  archiveprefix = {arXiv},
  url           = {http://dblp.uni-trier.de/db/journals/corr/corr2312.html#abs-2312-06109},
  ee            = {https://doi.org/10.48550/arXiv.2312.06109},
  keywords      = {dblp},
  biburl        = {https://www.bibsonomy.org/bibtex/200b628b3f0f21b1be32821753c77b19e/dblp},
  interhash     = {39686ae3e489922618c95742cf88c5c4},
  intrahash     = {00b628b3f0f21b1be32821753c77b19e},
  added-at      = {2024-01-03T00:00:00.000+0100},
  timestamp     = {2024-04-08T23:47:55.000+0200},
}