Can We Trust AI Benchmarks? An Interdisciplinary Review of Current Issues in AI Evaluation
Authors
Venue
arXiv preprint arXiv:2502.06559
Tags
Links
BibTeX
Local Entry
% arXiv preprint: the identifier lives in eprint/archiveprefix rather than in a journal field.
% Names use "Last, First" form; accents are written as BibTeX special characters.
@misc{eriksson2025benchmarks,
  author        = {Eriksson, Maria and Purificato, Erasmo and Noroozian, Arman and Vinagre, Jo{\~a}o and Chaslot, Guillaume and G{\'o}mez, Emilia and Fern{\'a}ndez-Llorca, David},
  title         = {Can We Trust {AI} Benchmarks? {An} Interdisciplinary Review of Current Issues in {AI} Evaluation},
  year          = {2025},
  eprint        = {2502.06559},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2502.06559},
}
From OPENALEX
% Aggregator-sourced record of an arXiv preprint: the repository label that was in the
% journal field is replaced by eprint/archiveprefix (number taken from the DOI suffix).
% Names use "Last, First" form so the two-word family name of the last author is not split;
% accents are written as BibTeX special characters for correct sorting under classic BibTeX.
@misc{eriksson2025benchmarks,
  author        = {Eriksson, Maria and Purificato, Erasmo and Noroozian, Arman and Vinagre, Jo{\~a}o and Chaslot, Guillaume and G{\'o}mez, Emilia and Fern{\'a}ndez Llorca, David},
  title         = {Can We Trust {AI} Benchmarks? {An} Interdisciplinary Review of Current Issues in {AI} Evaluation},
  year          = {2025},
  eprint        = {2502.06559},
  archiveprefix = {arXiv},
  doi           = {10.48550/arxiv.2502.06559},
}