% OmniVL paper, NeurIPS 2022 (Advances in Neural Information Processing Systems, vol. 35).
% The model name in the title is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{NEURIPS2022_259a5df4,
  author    = {Wang, Junke and Chen, Dongdong and Wu, Zuxuan and Luo, Chong and Zhou, Luowei and Zhao, Yucheng and Xie, Yujia and Liu, Ce and Jiang, Yu-Gang and Yuan, Lu},
  title     = {{OmniVL}: One Foundation Model for Image-Language and Video-Language Tasks},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Koyejo, S. and Mohamed, S. and Agarwal, A. and Belgrave, D. and Cho, K. and Oh, A.},
  volume    = {35},
  pages     = {5696--5710},
  publisher = {Curran Associates, Inc.},
  year      = {2022},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2022/file/259a5df46308d60f8454bd4adcc3b462-Paper-Conference.pdf},
}