{"id":"https://openalex.org/W7139043925","doi":"https://doi.org/10.48550/arxiv.2603.15807","title":"Lost in Transcription: Subtitle Errors in Automatic Speech Recognition Reduce Speaker and Content Evaluations","display_name":"Lost in Transcription: Subtitle Errors in Automatic Speech Recognition Reduce Speaker and Content Evaluations","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7139043925","doi":"https://doi.org/10.48550/arxiv.2603.15807"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15807","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129997462","display_name":"Kowe Kadoma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kadoma, Kowe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081620014","display_name":"Priyal Shrivastava","orcid":"https://orcid.org/0000-0003-3070-6760"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shrivastava, Priyal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5054248372","display_name":"Mor Naaman","orcid":"https://orcid.org/0000-0002-6436-3877"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naaman, Mor","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13310","display_name":"Subtitles and Audiovisual Media","score":0.8540999889373779,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13310","display_name":"Subtitles and Audiovisual Media","score":0.8540999889373779,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.018200000748038292,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12151","display_name":"Interpreting and Communication in Healthcare","score":0.01730000041425228,"subfield":{"id":"https://openalex.org/subfields/3600","display_name":"General Health Professions"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subtitle","display_name":"Subtitle","score":0.9211999773979187},{"id":"https://openalex.org/keywords/stress","display_name":"Stress (linguistics)","score":0.6060000061988831},{"id":"https://openalex.org/keywords/affect","display_name":"Affect (linguistics)","score":0.47749999165534973},{"id":"https://openalex.org/keywords/content","display_name":"Content (measure theory)","score":0.4050000011920929},{"id":"https://openalex.org/keywords/error-analysis","display_name":"Error analysis","score":0.29989999532699585}],"concepts":[{"id":"https://openalex.org/C2780364048","wikidata":"https://www.wikidata.org/wiki/Q204028","display_name":"Subtitle","level":2,"score":0.9211999773979187},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.628000020980835},{"id":"https://openalex.org/C2776756274","wikidata":"https://www.wikidata.org/wiki/Q181767","display_name":"Stress (linguistics)","level":2,"score":0.6060000061988831},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5680000185966492},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4982999861240387},{"id":"https://openalex.org/C2776035688","wikidata":"https://www.wikidata.org/wiki/Q1606558","display_name":"Affect (linguistics)","level":2,"score":0.47749999165534973},{"id":"https://openalex.org/C2778152352","wikidata":"https://www.wikidata.org/wiki/Q5165061","display_name":"Content (measure theory)","level":2,"score":0.4050000011920929},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.38749998807907104},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3772999942302704},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3411000072956085},{"id":"https://openalex.org/C3018824978","wikidata":"https://www.wikidata.org/wiki/Q2894891","display_name":"Error analysis","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.2980000078678131},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.2971999943256378},{"id":"https://openalex.org/C87868495","wikidata":"https://www.wikidata.org/wiki/Q750843","display_name":"Information processing","level":2,"score":0.2646999955177307}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.558951735496521,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Researchers":[0],"have":[1],"demonstrated":[2],"that":[3,57,94],"Automatic":[4],"Speech":[5],"Recognition":[6],"(ASR)":[7],"systems":[8,101],"perform":[9,102],"differently":[10],"across":[11],"demographic":[12],"groups.":[13],"In":[14],"this":[15,90],"work,":[16],"we":[17],"examined":[18],"how":[19],"subtitle":[20,82],"errors":[21],"affect":[22],"evaluations":[23,66],"of":[24,89],"speakers":[25,39,95],"and":[26,64],"their":[27],"content":[28,65],"using":[29],"a":[30,44],"preregistered":[31],"online":[32],"experiment":[33],"(N=207,":[34],"U.S.-based":[35],"crowdworkers).":[36],"Participants":[37],"watched":[38],"with":[40,96,112],"various":[41],"accents":[42,97],"deliver":[43],"talk":[45],"in":[46],"which":[47,99],"the":[48,77,87],"subtitles":[49,59],"were":[50],"accurate":[51],"or":[52],"error-prone.":[53],"Our":[54],"results":[55],"indicate":[56],"error-prone":[58],"consistently":[60],"reduce":[61],"both":[62],"speaker":[63],"for":[67,81,98],"all":[68],"speakers.":[69],"We":[70],"did":[71],"not":[72],"see":[73],"disparate":[74],"impact":[75],"between":[76],"accent":[78],"groups,":[79],"controlling":[80],"quality.":[83],"Taken":[84],"together,":[85],"though,":[86],"findings":[88],"short":[91],"paper":[92],"imply":[93],"ASR":[100],"poorly":[103],"are":[104],"likely":[105],"to":[106],"be":[107],"further":[108],"penalized":[109],"by":[110],"viewers":[111],"lower":[113],"evaluations.":[114]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-03-20T00:00:00"}
