VL-BERT
% arXiv preprint 1908.08530. The journal field keeps the identifier so classic
% styles still print it; eprint and archiveprefix carry the same identifier in
% structured form for eprint-aware styles. The acronym in the title is
% brace-protected so sentence-casing styles cannot lowercase it.
@article{su2019vl,
  author        = {Su, Weijie and Zhu, Xizhou and Cao, Yue and Li, Bin and Lu, Lewei and Wei, Furu and Dai, Jifeng},
  title         = {{VL-BERT}: Pre-training of Generic Visual-Linguistic Representations},
  journal       = {arXiv preprint arXiv:1908.08530},
  year          = {2019},
  eprint        = {1908.08530},
  archiveprefix = {arXiv},
}