Vivoli et al. "ComiCap: A VLMs Pipeline for Dense Captioning of Comic Panels." European Conference on Computer Vision Workshops, 2024. doi:10.1007/978-3-031-92808-6_4
Markdown
[Vivoli et al. "ComiCap: A VLMs Pipeline for Dense Captioning of Comic Panels." European Conference on Computer Vision Workshops, 2024.](https://mlanthology.org/eccvw/2024/vivoli2024eccvw-comicap/) doi:10.1007/978-3-031-92808-6_4
BibTeX
@inproceedings{vivoli2024eccvw-comicap,
  author    = {Vivoli, Emanuele and Biondi, Niccol{\`o} and Bertini, Marco and Karatzas, Dimosthenis},
  title     = {{ComiCap}: A {VLMs} Pipeline for Dense Captioning of Comic Panels},
  booktitle = {European Conference on Computer Vision Workshops},
  year      = {2024},
  pages     = {56--67},
  doi       = {10.1007/978-3-031-92808-6_4},
  url       = {https://mlanthology.org/eccvw/2024/vivoli2024eccvw-comicap/},
}