Jang et al. "Unifying Vision-Language Representation Space with Single-Tower Transformer." AAAI Conference on Artificial Intelligence, 2023. doi:10.1609/AAAI.V37I1.25178
Markdown
[Jang et al. "Unifying Vision-Language Representation Space with Single-Tower Transformer." AAAI Conference on Artificial Intelligence, 2023.](https://mlanthology.org/aaai/2023/jang2023aaai-unifying/) doi:10.1609/AAAI.V37I1.25178
BibTeX
@inproceedings{jang2023aaai-unifying,
  title     = {Unifying Vision-Language Representation Space with Single-Tower Transformer},
  author    = {Jang, Jiho and Kong, Chaerin and Jeon, Donghyeon and Kim, Seonhoon and Kwak, Nojun},
  booktitle = {{AAAI} Conference on Artificial Intelligence},
  year      = {2023},
  pages     = {980--988},
  doi       = {10.1609/AAAI.V37I1.25178},
  url       = {https://mlanthology.org/aaai/2023/jang2023aaai-unifying/},
}