Data Leverage References

← Back to browse

Can We Trust AI Benchmarks? An Interdisciplinary Review of Current Issues in AI Evaluation

2025 article eriksson2025benchmarks Not yet verified
Authors
Maria Eriksson, Erasmo Purificato, Arman Noroozian, Joao Vinagre, Guillaume Chaslot, Emilia Gomez, David Fernandez-Llorca
Venue
arXiv preprint arXiv:2502.06559
Tags

BibTeX

Local Entry
% arXiv preprint: the identifier lives in eprint/archiveprefix instead of being
% packed into a journal field, so the entry is typed as misc (there is no journal).
% Braces in the title protect "AI" and the "An" that follows the question mark
% from style-driven sentence-casing; authors use the unambiguous "Last, First" form.
@misc{eriksson2025benchmarks,
  author        = {Eriksson, Maria and Purificato, Erasmo and Noroozian, Arman and Vinagre, Joao and Chaslot, Guillaume and Gomez, Emilia and Fernandez-Llorca, David},
  title         = {Can We Trust {AI} Benchmarks? {An} Interdisciplinary Review of Current Issues in {AI} Evaluation},
  year          = {2025},
  eprint        = {2502.06559},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2502.06559},
  url           = {https://arxiv.org/abs/2502.06559},
}
From OPENALEX
% OpenAlex record, normalised: the repository label OpenAlex placed in the journal
% field is replaced by eprint/archiveprefix (entry typed as misc, as no journal exists).
% The last author's two-word surname is kept together via "Last, First" form, and
% accents are written as LaTeX escapes so classic 8-bit BibTeX sorts them correctly.
% NOTE(review): this record reuses the local entry's citation key; keep only one of
% the two in an actual .bib database, otherwise the key is reported as repeated.
@misc{eriksson2025benchmarks,
  author        = {Eriksson, Maria and Purificato, Erasmo and Noroozian, Arman and Vinagre, Jo{\~a}o and Chaslot, Guillaume and G{\'o}mez, Emilia and Fern{\'a}ndez Llorca, David},
  title         = {Can We Trust {AI} Benchmarks? {An} Interdisciplinary Review of Current Issues in {AI} Evaluation},
  year          = {2025},
  eprint        = {2502.06559},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2502.06559},
}