Wang et al. "A Multimodal, Multi-Task Adapting Framework for Video Action Recognition." AAAI Conference on Artificial Intelligence, 2024. doi:10.1609/AAAI.V38I6.28361
Markdown
[Wang et al. "A Multimodal, Multi-Task Adapting Framework for Video Action Recognition." AAAI Conference on Artificial Intelligence, 2024.](https://mlanthology.org/aaai/2024/wang2024aaai-multimodal/) doi:10.1609/AAAI.V38I6.28361
BibTeX
% AAAI 2024 conference paper. The title is stored in Title Case without
% whole-title brace protection so the bibliography style controls casing;
% the page range uses "--" so it renders as an en-dash.
@inproceedings{wang2024aaai-multimodal,
  title     = {A Multimodal, Multi-Task Adapting Framework for Video Action Recognition},
  author    = {Wang, Mengmeng and Xing, Jiazheng and Jiang, Boyuan and Chen, Jun and Mei, Jianbiao and Zuo, Xingxing and Dai, Guang and Wang, Jingdong and Liu, Yong},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {2024},
  pages     = {5517--5525},
  doi       = {10.1609/AAAI.V38I6.28361},
  url       = {https://mlanthology.org/aaai/2024/wang2024aaai-multimodal/},
}