% Workshop paper from the ACL Anthology (Anthology ID 2022.bigscience-1.10).
% The url field uses the permanent aclanthology.org address rather than a
% temporary preview-branch build.
@inproceedings{fries-etal-2022-dataset,
  author    = {Fries, Jason and Seelam, Natasha and Altay, Gabriel and Weber, Leon and Kang, Myungsun and Datta, Debajyoti and Su, Ruisi and Garda, Samuele and Wang, Bo and Ott, Simon and Samwald, Matthias and Kusa, Wojciech},
  title     = {Dataset Debt in Biomedical Language Modeling},
  editor    = {Fan, Angela and Ilic, Suzana and Wolf, Thomas and Gall{\'e}, Matthias},
  booktitle = {Proceedings of {BigScience} Episode {\#}5 -- Workshop on Challenges {\&} Perspectives in Creating Large Language Models},
  month     = may,
  year      = {2022},
  address   = {virtual+Dublin},
  publisher = {Association for Computational Linguistics},
  pages     = {137--145},
  doi       = {10.18653/v1/2022.bigscience-1.10},
  url       = {https://aclanthology.org/2022.bigscience-1.10/},
}