Park et al. "Accurate Sublayer Pruning for Large Language Models by Exploiting Latency and Tunability Information." International Joint Conference on Artificial Intelligence, 2025. doi:10.24963/IJCAI.2025/913
Markdown
[Park et al. "Accurate Sublayer Pruning for Large Language Models by Exploiting Latency and Tunability Information." International Joint Conference on Artificial Intelligence, 2025.](https://mlanthology.org/ijcai/2025/park2025ijcai-accurate/) doi:10.24963/IJCAI.2025/913
BibTeX
% Conference paper entry. The title is single-braced so the bibliography style
% controls casing; the page range uses the BibTeX "--" range separator.
@inproceedings{park2025ijcai-accurate,
  author    = {Park, Seungcheol and Lee, Sojin and Kim, Jongjin and Lee, Jinsik and Jo, Hyunjik and Kang, U},
  title     = {Accurate Sublayer Pruning for Large Language Models by Exploiting Latency and Tunability Information},
  booktitle = {International Joint Conference on Artificial Intelligence},
  year      = {2025},
  pages     = {8213--8221},
  doi       = {10.24963/IJCAI.2025/913},
  url       = {https://mlanthology.org/ijcai/2025/park2025ijcai-accurate/},
}