The Economics of AI Training Data: A Research Agenda
Authors
Venue
arXiv preprint
Abstract
A research agenda documenting AI training data deals from 2020 to 2025. It reveals persistent market fragmentation, five distinct pricing mechanisms (from per-unit licensing to commissioning), and that most deals exclude original creators from compensation: only 7 of 24 major deals compensate original creators.
Tags
Links
BibTeX
Local Entry
% arXiv preprint: recorded as misc with eprint/archiveprefix so the identifier
% lives in its own fields instead of a placeholder journal name.
@misc{oderinwale2025aitrainingeconomics,
  author        = {Oderinwale, Hamidah and Kazlauskas, Anna},
  title         = {The Economics of {AI} Training Data: A Research Agenda},
  year          = {2025},
  eprint        = {2510.24990},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2510.24990},
  url           = {https://arxiv.org/abs/2510.24990},
  abstract      = {Research agenda documenting AI training data deals from 2020 to 2025. Reveals persistent market fragmentation, five distinct pricing mechanisms (from per-unit licensing to commissioning), and that most deals exclude original creators from compensation. Found only 7 of 24 major deals compensate original creators.},
}
From AUTO:S2
% Auto-imported (AUTO:S2) record for the same work as the local entry.
% NOTE(review): it reuses the local entry's citation key; load only one of the
% two records into a single .bib database, or BibTeX reports a repeated entry.
@misc{oderinwale2025aitrainingeconomics,
  author        = {Oderinwale, Hamidah and Kazlauskas, Anna},
  title         = {The Economics of {AI} Training Data: A Research Agenda},
  year          = {2025},
  eprint        = {2510.24990},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2510.24990},
}