Ruan et al. "Accommodating Audio Modality in CLIP for Multimodal Processing." AAAI Conference on Artificial Intelligence, 2023. doi:10.1609/AAAI.V37I8.26153
Markdown
[Ruan et al. "Accommodating Audio Modality in CLIP for Multimodal Processing." AAAI Conference on Artificial Intelligence, 2023.](https://mlanthology.org/aaai/2023/ruan2023aaai-accommodating/) doi:10.1609/AAAI.V37I8.26153
BibTeX
% Conference paper entry. Braces around CLIP / AAAI protect the acronyms from
% style-applied sentence casing; the page range uses "--" (en dash) as BibTeX expects.
@inproceedings{ruan2023aaai-accommodating,
  title     = {Accommodating Audio Modality in {CLIP} for Multimodal Processing},
  author    = {Ruan, Ludan and Hu, Anwen and Song, Yuqing and Zhang, Liang and Zheng, Sipeng and Jin, Qin},
  booktitle = {{AAAI} Conference on Artificial Intelligence},
  year      = {2023},
  pages     = {9641--9649},
  doi       = {10.1609/AAAI.V37I8.26153},
  url       = {https://mlanthology.org/aaai/2023/ruan2023aaai-accommodating/}
}