% Deng et al., NeurIPS 2024: self-training on image comprehension for large vision language models.
@inproceedings{deng2024enhancing,
  author    = {Deng, Yihe and Lu, Pan and Yin, Fan and Hu, Ziniu and Shen, Sheng and Gu, Quanquan and Zou, James and Chang, Kai-Wei and Wang, Wei},
  title     = {Enhancing Large Vision Language Models with Self-Training on Image Comprehension},
  booktitle = {The 38th Conference on Neural Information Processing Systems ({NeurIPS})},
  year      = {2024},
}