{"id":"https://openalex.org/W4296069263","doi":"https://doi.org/10.21437/interspeech.2022-10816","title":"Toward Fairness in Speech Recognition: Discovery and mitigation of performance disparities","display_name":"Toward Fairness in Speech Recognition: Discovery and mitigation of performance disparities","publication_year":2022,"publication_date":"2022-09-16","ids":{"openalex":"https://openalex.org/W4296069263","doi":"https://doi.org/10.21437/interspeech.2022-10816"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2022-10816","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-10816","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031451770","display_name":"PRANAV DHERAM","orcid":null},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"PRANAV DHERAM","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009785474","display_name":"Murugesan Ramakrishnan","orcid":null},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Murugesan Ramakrishnan","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109046112","display_name":"Anirudh Raju","orcid":null},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anirudh Raju","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046605612","display_name":"I\u2010Ming Chen","orcid":"https://orcid.org/0000-0002-4831-3781"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"I-Fan Chen","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027102522","display_name":"Brian King","orcid":"https://orcid.org/0000-0002-5300-5564"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brian King","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016957625","display_name":"Katherine Powell","orcid":null},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Katherine Powell","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039857755","display_name":"Melissa Saboowala","orcid":null},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Melissa Saboowala","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108140703","display_name":"Karan Shetty","orcid":null},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Karan Shetty","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060979948","display_name":"Andreas Stolcke","orcid":"https://orcid.org/0000-0002-9925-905X"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andreas Stolcke","raw_affiliation_strings":["Amazon Alexa AI, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Alexa AI, USA","institution_ids":["https://openalex.org/I1311688040"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5031451770"],"corresponding_institution_ids":["https://openalex.org/I1311688040"],"apc_list":null,"apc_paid":null,"fwci":9.1466,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.99132948,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1268","last_page":"1272"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13812","display_name":"AI and HR Technologies","score":0.5073000192642212,"subfield":{"id":"https://openalex.org/subfields/1407","display_name":"Organizational Behavior and Human Resource Management"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13812","display_name":"AI and HR Technologies","score":0.5073000192642212,"subfield":{"id":"https://openalex.org/subfields/1407","display_name":"Organizational Behavior and Human Resource Management"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.49410000443458557,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14260","display_name":"Impact of AI and Big Data on Business and Society","score":0.4357999861240387,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6460089087486267},{"id":"https://openalex.org/keywords/oversampling","display_name":"Oversampling","score":0.5644140839576721},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5235728621482849},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5112099647521973},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.499753475189209},{"id":"https://openalex.org/keywords/cohort","display_name":"Cohort","score":0.4973435699939728},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4455568790435791},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.4269244074821472},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37975502014160156},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3788602948188782},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.2621288299560547},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1417681872844696},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.12941953539848328},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.12261593341827393},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09913620352745056},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.08464363217353821}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6460089087486267},{"id":"https://openalex.org/C197323446","wikidata":"https://www.wikidata.org/wiki/Q331222","display_name":"Oversampling","level":3,"score":0.5644140839576721},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5235728621482849},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5112099647521973},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.499753475189209},{"id":"https://openalex.org/C72563966","wikidata":"https://www.wikidata.org/wiki/Q1303415","display_name":"Cohort","level":2,"score":0.4973435699939728},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4455568790435791},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.4269244074821472},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37975502014160156},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3788602948188782},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.2621288299560547},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1417681872844696},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.12941953539848328},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.12261593341827393},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09913620352745056},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.08464363217353821},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2022-10816","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-10816","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.6899999976158142}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W74746702","https://openalex.org/W1828163288","https://openalex.org/W2053154970","https://openalex.org/W2143612262","https://openalex.org/W2753845591","https://openalex.org/W2788481061","https://openalex.org/W2913244614","https://openalex.org/W2948917818","https://openalex.org/W2963980299","https://openalex.org/W2972981900","https://openalex.org/W2983036158","https://openalex.org/W2997390712","https://openalex.org/W3012624518","https://openalex.org/W3035296331","https://openalex.org/W3035591180","https://openalex.org/W3147107444","https://openalex.org/W3176890131","https://openalex.org/W3181414820","https://openalex.org/W4286902103","https://openalex.org/W4307334170"],"related_works":["https://openalex.org/W3135230428","https://openalex.org/W2904739811","https://openalex.org/W2106462793","https://openalex.org/W2099105119","https://openalex.org/W2559837139","https://openalex.org/W2152158029","https://openalex.org/W2012540220","https://openalex.org/W2081671587","https://openalex.org/W1151175420","https://openalex.org/W2131711534"],"abstract_inverted_index":{"As":[0],"for":[1],"other":[2],"forms":[3],"of":[4,61,104],"AI,":[5],"speech":[6,26,71],"recognition":[7,27,72,128],"has":[8],"recently":[9],"been":[10],"examined":[11],"with":[12,56],"respect":[13],"to":[14,22,29,83],"performance":[15,38,62],"disparities":[16,63],"across":[17],"different":[18],"user":[19],"cohorts.One":[20],"approach":[21],"achieve":[23],"fairness":[24,42,98],"in":[25],"is":[28],"(1)":[30],"identify":[31],"speaker":[32,95,111],"cohorts":[33,47],"that":[34,88,102],"suffer":[35],"from":[36,66],"subpar":[37],"and":[39,59,80],"(2)":[40],"apply":[41],"mitigation":[43,60],"measures":[44],"targeting":[45],"the":[46,119],"discovered.In":[48],"this":[49],"paper,":[50],"we":[51,100],"report":[52],"on":[53,78],"initial":[54],"findings":[55],"both":[57],"discovery":[58,76],"using":[64,94],"data":[65],"a":[67,84],"product-scale":[68],"AI":[69],"assistant":[70],"system.We":[73],"compare":[74],"cohort":[75,112],"based":[77],"geographic":[79],"demographic":[81],"information":[82],"more":[85],"scalable":[86],"method":[87],"groups":[89],"speakers":[90],"without":[91,125],"human":[92],"labels,":[93],"embedding":[96],"technology.For":[97],"mitigation,":[99],"find":[101],"oversampling":[103],"underrepresented":[105],"cohorts,":[106,124],"as":[107,109],"well":[108],"modeling":[110],"membership":[113],"by":[114],"additional":[115],"input":[116],"variables,":[117],"reduces":[118],"gap":[120],"between":[121],"top-and":[122],"bottom-performing":[123],"deteriorating":[126],"overall":[127],"accuracy.":[129]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":7}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
