{"id":"https://openalex.org/W2124338691","doi":"https://doi.org/10.1109/asru.2009.5373493","title":"Generalization problem in ASR acoustic model training and adaptation","display_name":"Generalization problem in ASR acoustic model training and adaptation","publication_year":2009,"publication_date":"2009-12-01","ids":{"openalex":"https://openalex.org/W2124338691","doi":"https://doi.org/10.1109/asru.2009.5373493","mag":"2124338691"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2009.5373493","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2009.5373493","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://t2r2.star.titech.ac.jp/rrws/file/CTT100598393/ATD100000413/","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009532108","display_name":"Sadaoki Furui","orcid":null},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Sadaoki Furui","raw_affiliation_strings":["Department of Computer Science, Tokyo Institute of Technology, Meguro, Tokyo, Japan","Department of Computer Science, Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Tokyo Institute of Technology, Meguro, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]},{"raw_affiliation_string":"Department of Computer Science, Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5009532108"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":2.6171,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.90915692,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8434308171272278},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.7225164771080017},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7041480541229248},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.668217122554779},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.6491595506668091},{"id":"https://openalex.org/keywords/acoustic-model","display_name":"Acoustic model","score":0.5436692237854004},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.4988291263580322},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4723454713821411},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4320722818374634},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4103473424911499},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4008645713329315},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.39134031534194946}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8434308171272278},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.7225164771080017},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7041480541229248},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.668217122554779},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.6491595506668091},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.5436692237854004},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.4988291263580322},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4723454713821411},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4320722818374634},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4103473424911499},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4008645713329315},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.39134031534194946},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/asru.2009.5373493","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2009.5373493","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},{"id":"pmh:oai:t2r2.star.titech.ac.jp:50095230","is_oa":true,"landing_page_url":"http://t2r2.star.titech.ac.jp/cgi-bin/publicationinfo.cgi?q_publication_content_number=CTT100598393","pdf_url":"http://t2r2.star.titech.ac.jp/rrws/file/CTT100598393/ATD100000413/","source":{"id":"https://openalex.org/S4377196385","display_name":"Tokyo Tech Research Repository (Tokyo Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I114531698","host_organization_name":"Tokyo Institute of Technology","host_organization_lineage":["https://openalex.org/I114531698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"}],"best_oa_location":{"id":"pmh:oai:t2r2.star.titech.ac.jp:50095230","is_oa":true,"landing_page_url":"http://t2r2.star.titech.ac.jp/cgi-bin/publicationinfo.cgi?q_publication_content_number=CTT100598393","pdf_url":"http://t2r2.star.titech.ac.jp/rrws/file/CTT100598393/ATD100000413/","source":{"id":"https://openalex.org/S4377196385","display_name":"Tokyo Tech Research Repository (Tokyo Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I114531698","host_organization_name":"Tokyo Institute of Technology","host_organization_lineage":["https://openalex.org/I114531698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"},"sustainable_development_goals":[{"score":0.7799999713897705,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2124338691.pdf"},"referenced_works_count":94,"referenced_works":["https://openalex.org/W10427819","https://openalex.org/W16400594","https://openalex.org/W17294665","https://openalex.org/W31925794","https://openalex.org/W43454013","https://openalex.org/W63005457","https://openalex.org/W87533929","https://openalex.org/W108537639","https://openalex.org/W117579468","https://openalex.org/W142031455","https://openalex.org/W158338006","https://openalex.org/W175821084","https://openalex.org/W193308610","https://openalex.org/W285205250","https://openalex.org/W1481751294","https://openalex.org/W1483145160","https://openalex.org/W1511242468","https://openalex.org/W1572419603","https://openalex.org/W1574530145","https://openalex.org/W1599512239","https://openalex.org/W1898467614","https://openalex.org/W1900229942","https://openalex.org/W1920923476","https://openalex.org/W1953949349","https://openalex.org/W1966737826","https://openalex.org/W1979120075","https://openalex.org/W1987535750","https://openalex.org/W2002342963","https://openalex.org/W2014408663","https://openalex.org/W2034537249","https://openalex.org/W2037740282","https://openalex.org/W2038288667","https://openalex.org/W2053567709","https://openalex.org/W2053967299","https://openalex.org/W2063541597","https://openalex.org/W2081166343","https://openalex.org/W2081976287","https://openalex.org/W2089576851","https://openalex.org/W2096044236","https://openalex.org/W2096297019","https://openalex.org/W2100336732","https://openalex.org/W2100969003","https://openalex.org/W2104924374","https://openalex.org/W2106119541","https://openalex.org/W2106208939","https://openalex.org/W2111421849","https://openalex.org/W2113911479","https://openalex.org/W2114140497","https://openalex.org/W2118504934","https://openalex.org/W2120019470","https://openalex.org/W2121981798","https://openalex.org/W2123867168","https://openalex.org/W2124060484","https://openalex.org/W2131118559","https://openalex.org/W2135153490","https://openalex.org/W2142416747","https://openalex.org/W2143264198","https://openalex.org/W2146871184","https://openalex.org/W2149175990","https://openalex.org/W2150660184","https://openalex.org/W2150907703","https://openalex.org/W2153190454","https://openalex.org/W2155045454","https://openalex.org/W2155569120","https://openalex.org/W2156886787","https://openalex.org/W2157084746","https://openalex.org/W2160397028","https://openalex.org/W2164713009","https://openalex.org/W2167152389","https://openalex.org/W2384542382","https://openalex.org/W2484208911","https://openalex.org/W2799061466","https://openalex.org/W3142877555","https://openalex.org/W3144168424","https://openalex.org/W4205130185","https://openalex.org/W4239875977","https://openalex.org/W4256112632","https://openalex.org/W6600416867","https://openalex.org/W6601314542","https://openalex.org/W6602521540","https://openalex.org/W6603544418","https://openalex.org/W6606443625","https://openalex.org/W6607219637","https://openalex.org/W6610301154","https://openalex.org/W6628832040","https://openalex.org/W6641010790","https://openalex.org/W6663848509","https://openalex.org/W6671064254","https://openalex.org/W6674653747","https://openalex.org/W6674893724","https://openalex.org/W6676853410","https://openalex.org/W6677554280","https://openalex.org/W6682398751","https://openalex.org/W6683552698"],"related_works":["https://openalex.org/W2148579858","https://openalex.org/W2374918184","https://openalex.org/W2349258661","https://openalex.org/W2055900849","https://openalex.org/W4372341334","https://openalex.org/W1925506410","https://openalex.org/W562177300","https://openalex.org/W1535088811","https://openalex.org/W1489795889","https://openalex.org/W2793122029"],"abstract_inverted_index":{"Since":[0],"speech":[1,23,107,111,173,180],"is":[2,39,85,120,126],"highly":[3],"variable,":[4],"even":[5],"if":[6],"we":[7,13,157],"have":[8,55,140,154,161],"a":[9,103,110,162],"fairly":[10],"large-scale":[11],"database,":[12],"cannot":[14],"avoid":[15],"the":[16,42,60,82,87,133,179],"data":[17,38,181],"sparseness":[18],"problem":[19,62],"in":[20,47,63,91],"constructing":[21],"automatic":[22],"recognition":[24,75],"(ASR)":[25],"systems.":[26],"How":[27],"to":[28,58,72,146,169],"train":[29],"and":[30,67,94,132,144,175,185],"adapt":[31],"statistical":[32],"models":[33],"using":[34],"limited":[35],"amounts":[36],"of":[37,41,81,89,106,137,172,178],"one":[40],"most":[43],"important":[44],"research":[45],"issues":[46],"ASR.":[48],"This":[49],"paper":[50],"summarizes":[51],"major":[52],"techniques":[53,97,139,153],"that":[54,69,165],"been":[56,142,155],"proposed":[57],"solve":[59],"generalization":[61],"acoustic":[64],"model":[65,92],"training":[66,93,130,184],"adaptation,":[68],"is,":[70],"how":[71],"achieve":[73],"high":[74],"accuracy":[76],"for":[77,183],"new":[78],"utterances.":[79],"One":[80],"common":[83],"approaches":[84],"controlling":[86],"degree":[88],"freedom":[90],"adaptation.":[95,186],"The":[96],"can":[98,166],"be":[99,167],"classified":[100],"by":[101,109,117],"whether":[102],"priori":[104],"knowledge":[105],"obtained":[108],"database":[112],"such":[113],"as":[114],"those":[115],"spoken":[116],"many":[118,151],"speakers":[119],"used":[121],"or":[122],"not.":[123],"Another":[124],"approach":[125],"maximizing":[127],"\u00bfmargins\u00bf":[128],"between":[129],"samples":[131],"decision":[134],"boundaries.":[135],"Many":[136],"these":[138],"also":[141],"combined":[143],"extended":[145],"further":[147],"improve":[148],"performance.":[149],"Although":[150],"useful":[152],"developed,":[156],"still":[158],"do":[159],"not":[160],"golden":[163],"standard":[164],"applied":[168],"any":[170,176],"kind":[171],"variation":[174],"condition":[177],"available":[182]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
