% Fries et al. (2022), paper in the BigScience Episode 5 workshop proceedings.
% The url field holds the canonical ACL Anthology landing page (not a temporary
% preview-branch build), so the link stays valid alongside the DOI.
@inproceedings{fries-etal-2022-dataset,
    title     = {Dataset Debt in Biomedical Language Modeling},
    author    = {Fries, Jason and
                 Seelam, Natasha and
                 Altay, Gabriel and
                 Weber, Leon and
                 Kang, Myungsun and
                 Datta, Debajyoti and
                 Su, Ruisi and
                 Garda, Samuele and
                 Wang, Bo and
                 Ott, Simon and
                 Samwald, Matthias and
                 Kusa, Wojciech},
    editor    = {Fan, Angela and
                 Ilic, Suzana and
                 Wolf, Thomas and
                 Gall{\'e}, Matthias},
    booktitle = {Proceedings of BigScience Episode {\#}5 -- Workshop on Challenges {\&} Perspectives in Creating Large Language Models},
    month     = may,
    year      = {2022},
    address   = {virtual+Dublin},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2022.bigscience-1.10/},
    doi       = {10.18653/v1/2022.bigscience-1.10},
    pages     = {137--145},
}