Sun et al. "SciEval: A Multi-Level Large Language Model Evaluation Benchmark for Scientific Research." AAAI Conference on Artificial Intelligence, 2024. doi:10.1609/AAAI.V38I17.29872
Markdown
[Sun et al. "SciEval: A Multi-Level Large Language Model Evaluation Benchmark for Scientific Research." AAAI Conference on Artificial Intelligence, 2024.](https://mlanthology.org/aaai/2024/sun2024aaai-scieval/) doi:10.1609/AAAI.V38I17.29872
BibTeX
@inproceedings{sun2024aaai-scieval,
  title     = {{SciEval}: A Multi-Level Large Language Model Evaluation Benchmark for Scientific Research},
  author    = {Sun, Liangtai and Han, Yang and Zhao, Zihan and Ma, Da and Shen, Zhennan and Chen, Baocai and Chen, Lu and Yu, Kai},
  booktitle = {{AAAI} Conference on Artificial Intelligence},
  year      = {2024},
  pages     = {19053--19061},
  doi       = {10.1609/AAAI.V38I17.29872},
  url       = {https://mlanthology.org/aaai/2024/sun2024aaai-scieval/}
}