Luo et al. "C4AV: Learning Cross-Modal Representations from Transformers." European Conference on Computer Vision Workshops, 2020. doi:10.1007/978-3-030-66096-3_3
Markdown
[Luo et al. "C4AV: Learning Cross-Modal Representations from Transformers." European Conference on Computer Vision Workshops, 2020.](https://mlanthology.org/eccvw/2020/luo2020eccvw-c4av/) doi:10.1007/978-3-030-66096-3_3
BibTeX
% Workshop paper entry. Only the acronym in the title is brace-protected so
% bibliography styles can still apply their own casing to the other words.
@inproceedings{luo2020eccvw-c4av,
  title     = {{C4AV}: Learning Cross-Modal Representations from Transformers},
  author    = {Luo, Shujie and Dai, Hang and Shao, Ling and Ding, Yong},
  booktitle = {European Conference on Computer Vision Workshops},
  year      = {2020},
  pages     = {33--38},
  doi       = {10.1007/978-3-030-66096-3_3},
  url       = {https://mlanthology.org/eccvw/2020/luo2020eccvw-c4av/},
}