{"id":"https://openalex.org/W4416035277","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.1640","title":"Assumed Identities: Quantifying Gender Bias in Machine Translation of Gender-Ambiguous Occupational Terms","display_name":"Assumed Identities: Quantifying Gender Bias in Machine Translation of Gender-Ambiguous Occupational Terms","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4416035277","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.1640"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2025.emnlp-main.1640","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.1640","pdf_url":"https://aclanthology.org/2025.emnlp-main.1640.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.emnlp-main.1640.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032386720","display_name":"Orfeas Menis Mastromichalakis","orcid":"https://orcid.org/0000-0001-5286-1388"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Orfeas Menis Mastromichalakis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077371399","display_name":"Giorgos Filandrianos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Giorgos Filandrianos","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077110074","display_name":"Maria Symeonaki","orcid":"https://orcid.org/0000-0003-0755-1617"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maria Symeonaki","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5085359792","display_name":"Giorgos Stamou","orcid":"https://orcid.org/0000-0003-1210-9874"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Giorgos Stamou","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5032386720"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.41316384,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"32221","last_page":"32237"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13173","display_name":"Gender Studies in Language","score":0.2702000141143799,"subfield":{"id":"https://openalex.org/subfields/3318","display_name":"Gender Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13173","display_name":"Gender Studies in Language","score":0.2702000141143799,"subfield":{"id":"https://openalex.org/subfields/3318","display_name":"Gender Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.11640000343322754,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.10750000178813934,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.39750000834465027},{"id":"https://openalex.org/keywords/gender-bias","display_name":"Gender bias","score":0.38960000872612},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.32670000195503235},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.2851000130176544},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.2822999954223633}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5029000043869019},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5008999705314636},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.39750000834465027},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3919000029563904},{"id":"https://openalex.org/C2983427547","wikidata":"https://www.wikidata.org/wiki/Q93200","display_name":"Gender bias","level":2,"score":0.38960000872612},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.32670000195503235},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.31360000371932983},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2851000130176544},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.2822999954223633},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.28200000524520874},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2741999924182892},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.26089999079704285},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C2993271050","wikidata":"https://www.wikidata.org/wiki/Q93200","display_name":"Gender discrimination","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.emnlp-main.1640","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.1640","pdf_url":"https://aclanthology.org/2025.emnlp-main.1640.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.emnlp-main.1640","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.1640","pdf_url":"https://aclanthology.org/2025.emnlp-main.1640.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334322","display_name":"HORIZON EUROPE Framework Programme","ror":null},{"id":"https://openalex.org/F4320334779","display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","ror":"https://ror.org/00snfqn58"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416035277.pdf","grobid_xml":"https://content.openalex.org/works/W4416035277.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Machine":[0],"Translation":[1],"(MT)":[2],"systems":[3,94],"frequently":[4],"encounter":[5],"gender-ambiguous":[6,86],"occupational":[7,87,113],"terms,":[8],"where":[9],"they":[10],"must":[11],"assign":[12],"gender":[13,69,114],"without":[14],"explicit":[15],"contextual":[16],"cues.While":[17],"individual":[18],"translations":[19,100],"in":[20,83,101],"such":[21],"cases":[22],"may":[23],"not":[24],"be":[25],"inherently":[26],"biased,":[27],"systematic":[28],"patterns-such":[29],"as":[30,51],"consistently":[31],"translating":[32],"certain":[33],"professions":[34],"with":[35,85,106],"specific":[36],"genders-can":[37],"emerge,":[38],"reflecting":[39],"and":[40,95,103,116],"perpetuating":[41],"societal":[42,110],"stereotypes.This":[43],"ambiguity":[44],"challenges":[45],"traditional":[46],"instance-level":[47],"singleanswer":[48],"evaluation":[49],"approaches,":[50],"no":[52],"single":[53],"gold":[54],"standard":[55],"translation":[56],"exists.To":[57],"address":[58],"this,":[59,76],"we":[60,77,90],"introduce":[61],"GRAPE,":[62,89],"a":[63,80],"probability-based":[64],"metric":[65],"designed":[66],"to":[67],"evaluate":[68,91],"bias":[70],"by":[71],"analyzing":[72],"aggregated":[73],"model":[74],"responses.Alongside":[75],"present":[78],"GAMBIT,":[79],"benchmarking":[81],"dataset":[82],"English":[84],"terms.Using":[88],"several":[92],"MT":[93],"examine":[96],"whether":[97],"their":[98],"gendered":[99],"Greek":[102],"French":[104],"align":[105],"or":[107],"diverge":[108],"from":[109],"stereotypes,":[111],"real-world":[112],"distributions,":[115],"normative":[117],"standards":[118],"1":[119],".":[120]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-11-08T00:00:00"}
