What's in the Box? An Analysis of Undesirable Content in the Common Crawl Corpus
Authors
Venue
Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 2: Short Papers)
Tags
BibTeX
Local Entry
@inproceedings{luccioni2021box,
  author    = {Luccioni, Alexandra Sasha and Viviano, Joseph D.},
  title     = {What's in the Box? {An} Analysis of Undesirable Content in the {Common Crawl} Corpus},
  booktitle = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 2: Short Papers)},
  year      = {2021},
  doi       = {10.18653/v1/2021.acl-short.24},
  url       = {https://aclanthology.org/2021.acl-short.24/},
}
From OPENALEX
@inproceedings{luccioni2021box,
  author    = {Luccioni, Alexandra Sasha and Viviano, Joseph D.},
  title     = {What's in the Box? {An} Analysis of Undesirable Content in the {Common Crawl} Corpus},
  booktitle = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 2: Short Papers)},
  year      = {2021},
  doi       = {10.18653/v1/2021.acl-short.24},
}