{"id":"https://openalex.org/W1978741356","doi":"https://doi.org/10.1109/asru.2011.6163908","title":"Don't multiply lightly: Quantifying problems with the acoustic model assumptions in speech recognition","display_name":"Don't multiply lightly: Quantifying problems with the acoustic model assumptions in speech recognition","publication_year":2011,"publication_date":"2011-12-01","ids":{"openalex":"https://openalex.org/W1978741356","doi":"https://doi.org/10.1109/asru.2011.6163908","mag":"1978741356"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2011.6163908","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2011.6163908","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110207594","display_name":"Dan Gillick","orcid":null},"institutions":[{"id":"https://openalex.org/I1297971548","display_name":"International Computer Science Institute","ror":"https://ror.org/01ewh7m12","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1297971548"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dan Gillick","raw_affiliation_strings":["International Computer Science Institute, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Computer Science Institute, Berkeley, CA, USA","institution_ids":["https://openalex.org/I1297971548"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058277853","display_name":"Larry Gillick","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Larry Gillick","raw_affiliation_strings":["EnglishCentral, Inc., Arlington, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"EnglishCentral, Inc., Arlington, MA, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025957537","display_name":"Steven Wegmann","orcid":null},"institutions":[{"id":"https://openalex.org/I1297971548","display_name":"International Computer Science Institute","ror":"https://ror.org/01ewh7m12","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1297971548"]},{"id":"https://openalex.org/I135428043","display_name":"Cisco Systems (United States)","ror":"https://ror.org/03yt1ez60","country_code":"US","type":"company","lineage":["https://openalex.org/I135428043"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steven Wegmann","raw_affiliation_strings":["Cisco Systems, Inc., San Jose, CA, USA","International Computer Science Institute, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Cisco Systems, Inc., San Jose, CA, USA","institution_ids":["https://openalex.org/I135428043"]},{"raw_affiliation_string":"International Computer Science Institute, Berkeley, CA, USA","institution_ids":["https://openalex.org/I1297971548"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.5172,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.92703573,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"14","issue":null,"first_page":"71","last_page":"76"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.9124205112457275},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7608749270439148},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6400753259658813},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.6103436946868896},{"id":"https://openalex.org/keywords/independence","display_name":"Independence (probability theory)","score":0.5513021945953369},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.5366456508636475},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.5280091166496277},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5122339129447937},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5022768974304199},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4965267777442932},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4614822268486023},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.4569876194000244},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.45621269941329956},{"id":"https://openalex.org/keywords/series","display_name":"Series (stratigraphy)","score":0.42218124866485596},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4102591872215271},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13828158378601074},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.11975747346878052}],"concepts":[{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.9124205112457275},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7608749270439148},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6400753259658813},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.6103436946868896},{"id":"https://openalex.org/C35651441","wikidata":"https://www.wikidata.org/wiki/Q625303","display_name":"Independence (probability theory)","level":2,"score":0.5513021945953369},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.5366456508636475},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.5280091166496277},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5122339129447937},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5022768974304199},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4965267777442932},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4614822268486023},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.4569876194000244},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.45621269941329956},{"id":"https://openalex.org/C143724316","wikidata":"https://www.wikidata.org/wiki/Q312468","display_name":"Series (stratigraphy)","level":2,"score":0.42218124866485596},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4102591872215271},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13828158378601074},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.11975747346878052},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/asru.2011.6163908","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2011.6163908","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.799.7712","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.799.7712","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.icsi.berkeley.edu/pubs/speech/dontmultiplylightly11.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.699999988079071}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W943204654","https://openalex.org/W1500026161","https://openalex.org/W1631260214","https://openalex.org/W2003123121","https://openalex.org/W2051347452","https://openalex.org/W2078223462","https://openalex.org/W2083393647","https://openalex.org/W2098318492","https://openalex.org/W2106404689","https://openalex.org/W2106554350","https://openalex.org/W2111551391","https://openalex.org/W2122028591","https://openalex.org/W2124181495","https://openalex.org/W2156615793","https://openalex.org/W6636811518","https://openalex.org/W6683422774"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4380551139","https://openalex.org/W2280377497","https://openalex.org/W4387506531","https://openalex.org/W3174044702","https://openalex.org/W4238433571","https://openalex.org/W2967848559","https://openalex.org/W4283803360","https://openalex.org/W4317695495"],"abstract_inverted_index":{"We":[0],"describe":[1],"a":[2,22,43,47],"series":[3],"of":[4,24,33,68,77,92],"experiments":[5],"simulating":[6,30,55],"data":[7],"from":[8,56],"the":[9,34,57,64,69,74,89,93,104],"standard":[10],"Hidden":[11],"Markov":[12],"Model":[13],"(HMM)":[14],"framework":[15],"used":[16],"for":[17,46,60],"speech":[18],"recognition.":[19],"Starting":[20],"with":[21],"set":[23],"test":[25,88],"transcriptions,":[26],"we":[27,41],"begin":[28],"by":[29],"every":[31],"step":[32],"generative":[35],"process.":[36],"In":[37],"each":[38,78],"subsequent":[39],"experiment,":[40],"substitute":[42],"real":[44],"component":[45,49],"simulated":[48],"(real":[50],"state":[51],"durations":[52],"rather":[53],"than":[54,103],"transition":[58],"models,":[59],"example),":[61],"and":[62],"compare":[63],"word":[65],"error":[66],"rates":[67],"resulting":[70],"data,":[71],"thus":[72],"quantifying":[73],"relative":[75],"costs":[76],"modeling":[79],"assumption.":[80],"A":[81],"novel":[82],"sampling":[83],"process":[84],"allows":[85],"us":[86],"to":[87,97],"independence":[90],"assumptions":[91],"HMM,":[94],"which":[95],"appear":[96],"present":[98],"far":[99],"more":[100],"serious":[101],"problems":[102],"other":[105],"data/model":[106],"mismatches.":[107]},"counts_by_year":[{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
