{"id":"https://openalex.org/W4393970566","doi":"https://doi.org/10.1145/3640543.3645165","title":"Creating an African American-Sounding TTS: Guidelines, Technical Challenges, and Surprising Evaluations","display_name":"Creating an African American-Sounding TTS: Guidelines, Technical Challenges, and Surprising Evaluations","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4393970566","doi":"https://doi.org/10.1145/3640543.3645165"},"language":"en","primary_location":{"id":"doi:10.1145/3640543.3645165","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3640543.3645165","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3640543.3645165","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th International Conference on Intelligent User Interfaces","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3640543.3645165","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019048636","display_name":"Cl\u00e1udio Pinhanez","orcid":"https://orcid.org/0000-0001-6715-1290"},"institutions":[{"id":"https://openalex.org/I4210113516","display_name":"IBM Research - Brazil","ror":"https://ror.org/01fxqdx25","country_code":"BR","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210113516","https://openalex.org/I4210114115"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Claudio Santos Pinhanez","raw_affiliation_strings":["IBM Research, Brazil"],"raw_orcid":"https://orcid.org/0000-0001-6715-1290","affiliations":[{"raw_affiliation_string":"IBM Research, Brazil","institution_ids":["https://openalex.org/I4210113516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103271822","display_name":"Ra\u00fal Addine Fern\u00e1ndez","orcid":"https://orcid.org/0009-0009-7650-193X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Raul Fernandez","raw_affiliation_strings":["IBM Research, United States"],"raw_orcid":"https://orcid.org/0009-0009-7650-193X","affiliations":[{"raw_affiliation_string":"IBM Research, United States","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048212988","display_name":"Marcelo Grave","orcid":"https://orcid.org/0000-0003-1738-332X"},"institutions":[{"id":"https://openalex.org/I4210113516","display_name":"IBM Research - Brazil","ror":"https://ror.org/01fxqdx25","country_code":"BR","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210113516","https://openalex.org/I4210114115"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Marcelo Carpinette Grave","raw_affiliation_strings":["IBM Research, Brazil"],"raw_orcid":"https://orcid.org/0000-0003-1738-332X","affiliations":[{"raw_affiliation_string":"IBM Research, Brazil","institution_ids":["https://openalex.org/I4210113516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001862450","display_name":"Julio Nogima","orcid":"https://orcid.org/0009-0008-9764-6874"},"institutions":[{"id":"https://openalex.org/I4210113516","display_name":"IBM Research - Brazil","ror":"https://ror.org/01fxqdx25","country_code":"BR","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210113516","https://openalex.org/I4210114115"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Julio Nogima","raw_affiliation_strings":["IBM Research, Brazil"],"raw_orcid":"https://orcid.org/0009-0008-9764-6874","affiliations":[{"raw_affiliation_string":"IBM Research, Brazil","institution_ids":["https://openalex.org/I4210113516"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053864983","display_name":"Ron Hoory","orcid":"https://orcid.org/0009-0006-1327-5160"},"institutions":[{"id":"https://openalex.org/I4210167297","display_name":"IBM Research - Haifa","ror":"https://ror.org/05rw9t746","country_code":"IL","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210167297"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Ron Hoory","raw_affiliation_strings":["IBM Research, Israel"],"raw_orcid":"https://orcid.org/0009-0006-1327-5160","affiliations":[{"raw_affiliation_string":"IBM Research, Israel","institution_ids":["https://openalex.org/I4210167297"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5019048636"],"corresponding_institution_ids":["https://openalex.org/I4210113516"],"apc_list":null,"apc_paid":null,"fwci":0.7809,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.7833741,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"259","last_page":"273"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/representativeness-heuristic","display_name":"Representativeness heuristic","score":0.7351042032241821},{"id":"https://openalex.org/keywords/stress","display_name":"Stress (linguistics)","score":0.7093442678451538},{"id":"https://openalex.org/keywords/american-english","display_name":"American English","score":0.5996510982513428},{"id":"https://openalex.org/keywords/race","display_name":"Race (biology)","score":0.5414978861808777},{"id":"https://openalex.org/keywords/white","display_name":"White (mutation)","score":0.49657779932022095},{"id":"https://openalex.org/keywords/african-american","display_name":"African american","score":0.4773992598056793},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.44295603036880493},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.4302127957344055},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.42794716358184814},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4043487310409546},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.36061835289001465},{"id":"https://openalex.org/keywords/sociology","display_name":"Sociology","score":0.24950745701789856},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.2183533012866974},{"id":"https://openalex.org/keywords/gender-studies","display_name":"Gender studies","score":0.21716171503067017},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.1889834702014923},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.1869601309299469}],"concepts":[{"id":"https://openalex.org/C37381756","wikidata":"https://www.wikidata.org/wiki/Q20203288","display_name":"Representativeness heuristic","level":2,"score":0.7351042032241821},{"id":"https://openalex.org/C2776756274","wikidata":"https://www.wikidata.org/wiki/Q181767","display_name":"Stress (linguistics)","level":2,"score":0.7093442678451538},{"id":"https://openalex.org/C2777939226","wikidata":"https://www.wikidata.org/wiki/Q7976","display_name":"American English","level":2,"score":0.5996510982513428},{"id":"https://openalex.org/C76509639","wikidata":"https://www.wikidata.org/wiki/Q918036","display_name":"Race (biology)","level":2,"score":0.5414978861808777},{"id":"https://openalex.org/C56273599","wikidata":"https://www.wikidata.org/wiki/Q3122841","display_name":"White (mutation)","level":3,"score":0.49657779932022095},{"id":"https://openalex.org/C2987028688","wikidata":"https://www.wikidata.org/wiki/Q49085","display_name":"African american","level":2,"score":0.4773992598056793},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.44295603036880493},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4302127957344055},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.42794716358184814},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4043487310409546},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.36061835289001465},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.24950745701789856},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.2183533012866974},{"id":"https://openalex.org/C107993555","wikidata":"https://www.wikidata.org/wiki/Q1662673","display_name":"Gender studies","level":1,"score":0.21716171503067017},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.1889834702014923},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.1869601309299469},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C2549261","wikidata":"https://www.wikidata.org/wiki/Q43455","display_name":"Ethnology","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3640543.3645165","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3640543.3645165","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3640543.3645165","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th International Conference on Intelligent User Interfaces","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3640543.3645165","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3640543.3645165","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3640543.3645165","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th International Conference on Intelligent User Interfaces","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4393970566.pdf","grobid_xml":"https://content.openalex.org/works/W4393970566.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W1523550190","https://openalex.org/W1556641933","https://openalex.org/W1628789162","https://openalex.org/W2036233992","https://openalex.org/W2054021874","https://openalex.org/W2061141035","https://openalex.org/W2069573448","https://openalex.org/W2131916103","https://openalex.org/W2134344734","https://openalex.org/W2151401338","https://openalex.org/W2155980578","https://openalex.org/W2623601081","https://openalex.org/W2767655316","https://openalex.org/W2791568830","https://openalex.org/W2886048720","https://openalex.org/W2889160585","https://openalex.org/W2890184085","https://openalex.org/W2921047845","https://openalex.org/W2966398511","https://openalex.org/W2971062439","https://openalex.org/W2982552777","https://openalex.org/W3009222807","https://openalex.org/W3047117292","https://openalex.org/W3121078277","https://openalex.org/W3175765954","https://openalex.org/W4205795265","https://openalex.org/W4292341621","https://openalex.org/W4385822623"],"related_works":["https://openalex.org/W644364909","https://openalex.org/W2034865276","https://openalex.org/W640712713","https://openalex.org/W4386460245","https://openalex.org/W2126764764","https://openalex.org/W2121210147","https://openalex.org/W2786897797","https://openalex.org/W3024271910","https://openalex.org/W3198486451","https://openalex.org/W1488684580"],"abstract_inverted_index":{"Representations":[0],"of":[1,16,40,47,74,89,106,148,153,169],"AI":[2],"agents":[3],"in":[4,14,23,37,44],"user":[5],"interfaces":[6],"and":[7,18,84,92,98],"robotics":[8],"are":[9],"predominantly":[10],"White,":[11],"not":[12,129,164],"only":[13,165],"terms":[15],"facial":[17],"skin":[19],"features,":[20],"but":[21,176],"also":[22,177],"the":[24,38,45,72,87,107,112,126,133,137,146,167,170,180,189,192],"synthetic":[25],"voices":[26,203],"they":[27],"use.":[28],"In":[29],"this":[30],"paper":[31,68],"we":[32,42,174],"explore":[33],"some":[34,105],"unexpected":[35],"challenges":[36,85],"representation":[39],"race":[41,135,147],"found":[43],"process":[46],"developing":[48],"an":[49,59],"U.S.":[50,122],"English":[51,123],"Text-to-Speech":[52],"(TTS)":[53],"system":[54,95,114,152],"aimed":[55],"to":[56,131,136,198,204],"sound":[57],"like":[58],"educated,":[60,200],"professional,":[61],"regional":[62],"accent-free":[63],"African":[64,78,138,160,171,205],"American":[65,79,139,161,172,206],"woman.":[66],"The":[67],"starts":[69],"by":[70,101,111,188],"presenting":[71],"results":[73,183],"focus":[75,157],"groups":[76],"with":[77,121,159],"IT":[80,162],"professionals":[81],"where":[82,125],"guidelines":[83],"for":[86],"creation":[88],"a":[90,102,149],"representative":[91],"appropriate":[93],"TTS":[94,113,140,151],"were":[96,128],"discussed":[97],"gathered,":[99],"followed":[100],"discussion":[103],"about":[104],"technical":[108],"difficulties":[109],"faced":[110],"developers.":[115],"We":[116],"then":[117],"describe":[118],"two":[119],"studies":[120],"speakers":[124],"participants":[127],"able":[130],"attribute":[132],"correct":[134],"voice":[141,173],"while":[142],"overwhelmingly":[143],"correctly":[144],"recognizing":[145],"White":[150],"similar":[154],"quality.":[155],"A":[156],"group":[158],"workers":[163],"confirmed":[166],"representativeness":[168],"built,":[175],"suggested":[178],"that":[179],"surprising":[181],"recognition":[182],"may":[184],"have":[185],"been":[186],"caused":[187],"inability":[190],"or":[191],"latent":[193],"prejudice":[194],"from":[195],"non-African":[196],"Americans":[197],"associate":[199],"non-vernacular,":[201],"professionally-sounding":[202],"people.":[207]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
