@inproceedings{joseph-morgan-2020-word,
title = "When do Word Embeddings Accurately Reflect Surveys on our Beliefs About People?",
author = "Joseph, Kenneth and
Morgan, Jonathan",
booktitle = "Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics",
month = jul,
year = "2020",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2020.acl-main.405",
doi = "10.18653/v1/2020.acl-main.405",
pages = "4392--4415",
abstract = "Social biases are encoded in word embeddings. This presents a unique opportunity to study society historically and at scale, and a unique danger when embeddings are used in downstream applications. Here, we investigate the extent to which publicly-available word embeddings accurately reflect beliefs about certain kinds of people as measured via traditional survey methods. We find that biases found in word embeddings do, on average, closely mirror survey data across seventeen dimensions of social meaning. However, we also find that biases in embeddings are much more reflective of survey data for some dimensions of meaning (e.g. gender) than others (e.g. race), and that we can be highly confident that embedding-based measures reflect survey data only for the most salient biases.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="joseph-morgan-2020-word">
<titleInfo>
<title>When do Word Embeddings Accurately Reflect Surveys on our Beliefs About People?</title>
</titleInfo>
<name type="personal">
<namePart type="given">Kenneth</namePart>
<namePart type="family">Joseph</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jonathan</namePart>
<namePart type="family">Morgan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2020-jul</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics</title>
</titleInfo>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Online</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Social biases are encoded in word embeddings. This presents a unique opportunity to study society historically and at scale, and a unique danger when embeddings are used in downstream applications. Here, we investigate the extent to which publicly-available word embeddings accurately reflect beliefs about certain kinds of people as measured via traditional survey methods. We find that biases found in word embeddings do, on average, closely mirror survey data across seventeen dimensions of social meaning. However, we also find that biases in embeddings are much more reflective of survey data for some dimensions of meaning (e.g. gender) than others (e.g. race), and that we can be highly confident that embedding-based measures reflect survey data only for the most salient biases.</abstract>
<identifier type="citekey">joseph-morgan-2020-word</identifier>
<identifier type="doi">10.18653/v1/2020.acl-main.405</identifier>
<location>
<url>https://aclanthology.org/2020.acl-main.405</url>
</location>
<part>
<date>2020-jul</date>
<extent unit="page">
<start>4392</start>
<end>4415</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T When do Word Embeddings Accurately Reflect Surveys on our Beliefs About People?
%A Joseph, Kenneth
%A Morgan, Jonathan
%S Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics
%D 2020
%8 jul
%I Association for Computational Linguistics
%C Online
%F joseph-morgan-2020-word
%X Social biases are encoded in word embeddings. This presents a unique opportunity to study society historically and at scale, and a unique danger when embeddings are used in downstream applications. Here, we investigate the extent to which publicly-available word embeddings accurately reflect beliefs about certain kinds of people as measured via traditional survey methods. We find that biases found in word embeddings do, on average, closely mirror survey data across seventeen dimensions of social meaning. However, we also find that biases in embeddings are much more reflective of survey data for some dimensions of meaning (e.g. gender) than others (e.g. race), and that we can be highly confident that embedding-based measures reflect survey data only for the most salient biases.
%R 10.18653/v1/2020.acl-main.405
%U https://aclanthology.org/2020.acl-main.405
%U https://doi.org/10.18653/v1/2020.acl-main.405
%P 4392-4415
Markdown (Informal)
[When do Word Embeddings Accurately Reflect Surveys on our Beliefs About People?](https://aclanthology.org/2020.acl-main.405) (Joseph & Morgan, ACL 2020)
ACL