Li et al. "Patch-Level Sounding Object Tracking for Audio-Visual Question Answering." AAAI Conference on Artificial Intelligence, 2025. doi:10.1609/AAAI.V39I5.32538
Markdown
[Li et al. "Patch-Level Sounding Object Tracking for Audio-Visual Question Answering." AAAI Conference on Artificial Intelligence, 2025.](https://mlanthology.org/aaai/2025/li2025aaai-patch/) doi:10.1609/AAAI.V39I5.32538
BibTeX
@comment{Conference paper entry; the title is left unbraced so the bibliography style controls its casing.}
@inproceedings{li2025aaai-patch,
  title     = {Patch-Level Sounding Object Tracking for Audio-Visual Question Answering},
  author    = {Li, Zhangbin and Zhou, Jinxing and Zhang, Jing and Tang, Shengeng and Li, Kun and Guo, Dan},
  booktitle = {{AAAI} Conference on Artificial Intelligence},
  year      = {2025},
  pages     = {5075--5083},
  doi       = {10.1609/AAAI.V39I5.32538},
  url       = {https://mlanthology.org/aaai/2025/li2025aaai-patch/},
}