Zhu et al. "Multichannel AV-Wav2vec2: A Framework for Learning Multichannel Multi-Modal Speech Representation." AAAI Conference on Artificial Intelligence, 2024. doi:10.1609/AAAI.V38I17.29951
Markdown
[Zhu et al. "Multichannel AV-Wav2vec2: A Framework for Learning Multichannel Multi-Modal Speech Representation." AAAI Conference on Artificial Intelligence, 2024.](https://mlanthology.org/aaai/2024/zhu2024aaai-multichannel/) doi:10.1609/AAAI.V38I17.29951
BibTeX
@inproceedings{zhu2024aaai-multichannel,
  author    = {Zhu, Qiushi and Zhang, Jie and Gu, Yu and Hu, Yuchen and Dai, Lirong},
  title     = {Multichannel {AV-Wav2vec2}: A Framework for Learning Multichannel Multi-Modal Speech Representation},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {2024},
  pages     = {19768--19776},
  doi       = {10.1609/AAAI.V38I17.29951},
  url       = {https://mlanthology.org/aaai/2024/zhu2024aaai-multichannel/},
}