{"id":"https://openalex.org/W3015634748","doi":"https://doi.org/10.1109/icassp40776.2020.9053287","title":"On Modeling ASR Word Confidence","display_name":"On Modeling ASR Word Confidence","publication_year":2020,"publication_date":"2020-04-09","ids":{"openalex":"https://openalex.org/W3015634748","doi":"https://doi.org/10.1109/icassp40776.2020.9053287","mag":"3015634748"},"language":"en","primary_location":{"id":"doi:10.1109/icassp40776.2020.9053287","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053287","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055671046","display_name":"Woojay Jeon","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153776","display_name":"Apple (United States)","ror":"https://ror.org/059hsda18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210153776"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Woojay Jeon","raw_affiliation_strings":["Apple Inc., Cupertino, California"],"affiliations":[{"raw_affiliation_string":"Apple Inc., Cupertino, California","institution_ids":["https://openalex.org/I4210153776"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087117921","display_name":"Maxwell Jordan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153776","display_name":"Apple (United States)","ror":"https://ror.org/059hsda18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210153776"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maxwell Jordan","raw_affiliation_strings":["Apple Inc., Cupertino, California"],"affiliations":[{"raw_affiliation_string":"Apple Inc., Cupertino, California","institution_ids":["https://openalex.org/I4210153776"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085465402","display_name":"Mahesh Krishnamoorthy","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153776","display_name":"Apple (United States)","ror":"https://ror.org/059hsda18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210153776"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mahesh Krishnamoorthy","raw_affiliation_strings":["Apple Inc., Cupertino, California"],"affiliations":[{"raw_affiliation_string":"Apple Inc., Cupertino, California","institution_ids":["https://openalex.org/I4210153776"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5055671046"],"corresponding_institution_ids":["https://openalex.org/I4210153776"],"apc_list":null,"apc_paid":null,"fwci":0.5302,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.71709296,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7887357473373413},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7372063994407654},{"id":"https://openalex.org/keywords/confusion","display_name":"Confusion","score":0.6407080888748169},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5476192831993103},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5267423987388611},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.524463415145874},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.4955791234970093},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4740312397480011},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.44316381216049194},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4292922019958496},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.42409542202949524},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.16635918617248535},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10727348923683167}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7887357473373413},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7372063994407654},{"id":"https://openalex.org/C2781140086","wikidata":"https://www.wikidata.org/wiki/Q557945","display_name":"Confusion","level":2,"score":0.6407080888748169},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5476192831993103},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5267423987388611},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.524463415145874},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.4955791234970093},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4740312397480011},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.44316381216049194},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4292922019958496},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.42409542202949524},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.16635918617248535},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10727348923683167},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C11171543","wikidata":"https://www.wikidata.org/wiki/Q41630","display_name":"Psychoanalysis","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp40776.2020.9053287","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053287","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W34303869","https://openalex.org/W1571931074","https://openalex.org/W1598033630","https://openalex.org/W2012942264","https://openalex.org/W2107091848","https://openalex.org/W2115568091","https://openalex.org/W2129334286","https://openalex.org/W2134659216","https://openalex.org/W2250539671","https://openalex.org/W2511962886","https://openalex.org/W2594610113","https://openalex.org/W2773499542","https://openalex.org/W2963505832","https://openalex.org/W6635717444"],"related_works":["https://openalex.org/W2309273277","https://openalex.org/W2061937230","https://openalex.org/W1574295218","https://openalex.org/W113247760","https://openalex.org/W1967477266","https://openalex.org/W2547793174","https://openalex.org/W2070212102","https://openalex.org/W2544241817","https://openalex.org/W2914603036","https://openalex.org/W2158882055"],"abstract_inverted_index":{"We":[0,40],"present":[1],"a":[2,43,51,69,84],"new":[3,44,70],"method":[4,45,73,127],"for":[5,18,46,74],"computing":[6],"ASR":[7,16],"word":[8,24,48,97,105],"confidences":[9],"that":[10,57,103,124],"effectively":[11],"mitigates":[12],"the":[13,23,28,92,99,104,108,116,121,125,131],"effect":[14],"of":[15,27,35,78,95,120,133],"errors":[17],"diverse":[19],"downstream":[20],"applications,":[21],"improves":[22],"error":[25],"rate":[26],"1-best":[29,118],"result,":[30],"and":[31,67,123],"allows":[32],"better":[33],"comparison":[34,77],"scores":[36,79,94],"across":[37],"different":[38,81],"models.":[39,82],"propose":[41],"1)":[42],"modeling":[47],"confidence":[49,93,111],"using":[50],"Heterogeneous":[52],"Word":[53,64],"Confusion":[54,65],"Network":[55],"(HWCN)":[56],"addresses":[58],"some":[59],"key":[60],"flaws":[61],"in":[62,98],"conventional":[63],"Networks,":[66],"2)":[68],"score":[71],"calibration":[72,126],"facilitating":[75],"direct":[76],"from":[80],"Using":[83],"bidirectional":[85],"lattice":[86],"recurrent":[87],"neural":[88],"network":[89],"to":[90],"compute":[91],"each":[96],"HWCN,":[100],"we":[101],"show":[102],"sequence":[106],"with":[107],"best":[109],"overall":[110],"is":[112],"more":[113],"accurate":[114],"than":[115],"default":[117],"result":[119],"recognizer,":[122],"can":[128],"substantially":[129],"improve":[130],"reliability":[132],"recognizer":[134],"combination.":[135]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
