{"id":"https://openalex.org/W3212216134","doi":"https://doi.org/10.1109/taslp.2021.3126949","title":"Counterfactually Fair Automatic Speech Recognition","display_name":"Counterfactually Fair Automatic Speech Recognition","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3212216134","doi":"https://doi.org/10.1109/taslp.2021.3126949","mag":"3212216134"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2021.3126949","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3126949","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1109/taslp.2021.3126949","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113969253","display_name":"Leda Sar","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Leda Sar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004778663","display_name":"Mark Hasegawa\u2010Johnson","orcid":"https://orcid.org/0000-0002-5631-2893"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark Hasegawa-Johnson","raw_affiliation_strings":["Electrical and Computer Engineering, University of Illinois at Urbana-Champaign, Urbana, Illinois, United States, 61801 (e-mail: jhasegaw@illinois.edu)"],"affiliations":[{"raw_affiliation_string":"Electrical and Computer Engineering, University of Illinois at Urbana-Champaign, Urbana, Illinois, United States, 61801 (e-mail: jhasegaw@illinois.edu)","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073287748","display_name":"Chang D. Yoo","orcid":"https://orcid.org/0000-0002-0756-7179"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Chang D. Yoo","raw_affiliation_strings":["Dept. Electrical Engineering, KAIST - Korea Advanced Institute of Science & Technology, Daejeon, Korea (the Republic of), 34141 (e-mail: cd_yoo@kaist.ac.kr)"],"affiliations":[{"raw_affiliation_string":"Dept. Electrical Engineering, KAIST - Korea Advanced Institute of Science & Technology, Daejeon, Korea (the Republic of), 34141 (e-mail: cd_yoo@kaist.ac.kr)","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5113969253"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6897,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.87274381,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"29","issue":null,"first_page":"3515","last_page":"3525"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.8804498910903931},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5198367238044739},{"id":"https://openalex.org/keywords/odds","display_name":"Odds","score":0.5059062838554382},{"id":"https://openalex.org/keywords/connectionism","display_name":"Connectionism","score":0.49307581782341003},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4731016159057617},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.4609295725822449},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.40382397174835205},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26553478837013245},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.26431626081466675},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.21352046728134155},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.15734729170799255},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.13428843021392822}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.8804498910903931},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5198367238044739},{"id":"https://openalex.org/C143095724","wikidata":"https://www.wikidata.org/wiki/Q515895","display_name":"Odds","level":3,"score":0.5059062838554382},{"id":"https://openalex.org/C8521452","wikidata":"https://www.wikidata.org/wiki/Q203790","display_name":"Connectionism","level":3,"score":0.49307581782341003},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4731016159057617},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.4609295725822449},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.40382397174835205},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26553478837013245},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.26431626081466675},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.21352046728134155},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.15734729170799255},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.13428843021392822}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2021.3126949","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3126949","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/taslp.2021.3126949","is_oa":true,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3126949","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8299999833106995,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W72757270","https://openalex.org/W1494198834","https://openalex.org/W1828163288","https://openalex.org/W1882958252","https://openalex.org/W2017480732","https://openalex.org/W2048087720","https://openalex.org/W2049910836","https://openalex.org/W2079623482","https://openalex.org/W2100960835","https://openalex.org/W2127141656","https://openalex.org/W2143612262","https://openalex.org/W2193413348","https://openalex.org/W2327501763","https://openalex.org/W2398776621","https://openalex.org/W2493567909","https://openalex.org/W2530395818","https://openalex.org/W2545177271","https://openalex.org/W2627092829","https://openalex.org/W2726674076","https://openalex.org/W2753845591","https://openalex.org/W2809878087","https://openalex.org/W2892038960","https://openalex.org/W2936774411","https://openalex.org/W2949992972","https://openalex.org/W2964031043","https://openalex.org/W2977235550","https://openalex.org/W2983036158","https://openalex.org/W3001553940","https://openalex.org/W3012624518","https://openalex.org/W3033733989","https://openalex.org/W3080248383","https://openalex.org/W3092661284","https://openalex.org/W3101767999","https://openalex.org/W3126686938","https://openalex.org/W3152436735","https://openalex.org/W4288282543","https://openalex.org/W4288586852","https://openalex.org/W4295097398","https://openalex.org/W4295253939","https://openalex.org/W4295312788","https://openalex.org/W6638749077","https://openalex.org/W6639480849","https://openalex.org/W6687566353","https://openalex.org/W6728551298","https://openalex.org/W6739095351","https://openalex.org/W6740362099","https://openalex.org/W6744097617","https://openalex.org/W6744110554","https://openalex.org/W6765645076","https://openalex.org/W6766978945","https://openalex.org/W6768299147","https://openalex.org/W6790219302"],"related_works":["https://openalex.org/W2309273277","https://openalex.org/W2061937230","https://openalex.org/W1769849273","https://openalex.org/W1574295218","https://openalex.org/W113247760","https://openalex.org/W1967477266","https://openalex.org/W2547793174","https://openalex.org/W2070212102","https://openalex.org/W2132658536","https://openalex.org/W2544241817"],"abstract_inverted_index":{"Widely":[0],"used":[1],"automatic":[2],"speech":[3],"recognition":[4],"(ASR)":[5],"systems":[6],"have":[7],"been":[8],"empirically":[9],"demonstrated":[10],"in":[11,33,114,122],"various":[12],"studies":[13],"to":[14,30,36,111,138,170,175],"be":[15],"unfair,":[16],"having":[17],"higher":[18],"error":[19,192,204],"rates":[20,193],"for":[21,144,172],"some":[22],"groups":[23],"of":[24,44,68,74,105,160],"users":[25],"than":[26],"others.":[27],"One":[28],"way":[29],"define":[31],"fairness":[32,104],"ASR":[34,106,110,151],"is":[35],"require":[37],"that":[38,183],"changing":[39,48],"the":[40,58,66,78,83,94,103,109,123,129,158,167],"demographic":[41,125,200],"group":[42,75,91],"affiliation":[43,76,92],"any":[45],"individual":[46],"(e.g.,":[47,77,93],"their":[49,142],"gender,":[50,176],"age,":[51,177],"education":[52],"or":[53],"race)":[54],"should":[55],"not":[56],"change":[57,113,121],"probability":[59],"distribution":[60],"across":[61],"possible":[62],"speech-to-text":[63],"transcriptions.":[64],"In":[65],"paradigm":[67],"counterfactual":[69,120,131,185],"fairness,":[70],"all":[71],"variables":[72,88],"independent":[73],"text":[79],"being":[80],"read":[81],"by":[82,107],"speaker)":[84],"remain":[85],"unchanged,":[86],"while":[87,194],"dependent":[89],"on":[90,157],"speaker's":[95],"voice)":[96],"are":[97],"counterfactually":[98],"modified.":[99],"Hence,":[100],"we":[101,135,187],"approach":[102],"training":[108],"minimize":[112],"its":[115],"outcome":[116],"probabilities":[117],"despite":[118],"a":[119],"individual's":[124],"attributes.":[126],"Starting":[127],"from":[128],"individualized":[130],"equal":[132],"odds":[133],"criterion,":[134],"provide":[136],"relaxations":[137],"it":[139],"and":[140,166,179,202],"compare":[141],"performances":[143],"connectionist":[145],"temporal":[146],"classification":[147],"(CTC)":[148],"based":[149],"end-to-end":[150],"systems.":[152],"We":[153,181],"perform":[154],"our":[155],"experiments":[156],"Corpus":[159],"Regional":[161],"African":[162],"American":[163],"Languages":[164],"(CORAAL)":[165],"LibriSpeech":[168],"dataset":[169],"accommodate":[171],"differences":[173],"due":[174],"education,":[178],"race.":[180],"show":[182],"with":[184],"training,":[186],"can":[188],"reduce":[189],"average":[190],"character":[191],"achieving":[195],"lower":[196,203],"performance":[197],"gap":[198],"between":[199],"groups,":[201],"standard":[205],"deviation":[206],"among":[207],"individuals.":[208]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":1}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
