{"id":"https://openalex.org/W2972682576","doi":"https://doi.org/10.21437/interspeech.2019-2620","title":"Acoustic Model Optimization Based on Evolutionary Stochastic Gradient Descent with Anchors for Automatic Speech Recognition","display_name":"Acoustic Model Optimization Based on Evolutionary Stochastic Gradient Descent with Anchors for Automatic Speech Recognition","publication_year":2019,"publication_date":"2019-09-13","ids":{"openalex":"https://openalex.org/W2972682576","doi":"https://doi.org/10.21437/interspeech.2019-2620","mag":"2972682576"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2019-2620","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2019-2620","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2019","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102014291","display_name":"Xiaodong Cui","orcid":"https://orcid.org/0000-0003-4865-1307"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xiaodong Cui","raw_affiliation_strings":["IBM Research AI IBM T. J. Watson Research Center, Yorktown Heights, NY 10598, USA"],"affiliations":[{"raw_affiliation_string":"IBM Research AI IBM T. J. Watson Research Center, Yorktown Heights, NY 10598, USA","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034529775","display_name":"Michael Picheny","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Picheny","raw_affiliation_strings":["IBM Research AI IBM T. J. Watson Research Center, Yorktown Heights, NY 10598, USA"],"affiliations":[{"raw_affiliation_string":"IBM Research AI IBM T. J. Watson Research Center, Yorktown Heights, NY 10598, USA","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5102014291"],"corresponding_institution_ids":["https://openalex.org/I1341412227"],"apc_list":null,"apc_paid":null,"fwci":0.3317,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.55781269,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1581","last_page":"1585"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7394018173217773},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.6497329473495483},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.6061428785324097},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.5468286871910095},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.5023007392883301},{"id":"https://openalex.org/keywords/evolutionary-computation","display_name":"Evolutionary computation","score":0.50156569480896},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.43994542956352234},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43004870414733887},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.17015770077705383}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7394018173217773},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.6497329473495483},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.6061428785324097},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.5468286871910095},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.5023007392883301},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.50156569480896},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.43994542956352234},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43004870414733887},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.17015770077705383},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2019-2620","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2019-2620","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2019","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1899249567","https://openalex.org/W2090861223","https://openalex.org/W2114016253","https://openalex.org/W2129272928","https://openalex.org/W2150769028","https://openalex.org/W2150907703","https://openalex.org/W2952716993","https://openalex.org/W2963157343","https://openalex.org/W4324106947","https://openalex.org/W4394662461"],"related_works":["https://openalex.org/W4206903459","https://openalex.org/W2754816816","https://openalex.org/W4366280654","https://openalex.org/W3160167280","https://openalex.org/W4231621013","https://openalex.org/W4362706668","https://openalex.org/W3008318776","https://openalex.org/W2041416246","https://openalex.org/W3020853991","https://openalex.org/W3035836947"],"abstract_inverted_index":{"Evolutionary":[0],"stochastic":[1],"gradient":[2],"descent":[3],"(ESGD)":[4],"was":[5],"proposed":[6],"as":[7,58],"a":[8,30,51],"population-based":[9],"approach":[10],"that":[11,85,111],"combines":[12],"the":[13,48,62,71,74,81,88,92,98,112,119,125],"merits":[14],"of":[15,32,36,50,91],"gradient-aware":[16],"and":[17,55,106,121],"gradient-free":[18],"optimization":[19,24,35],"algorithms":[20],"for":[21,34,39],"superior":[22],"overall":[23],"performance.In":[25],"this":[26,44],"paper":[27],"we":[28,46],"investigate":[29],"variant":[31],"ESGD":[33,78,113],"acoustic":[37,53,128],"models":[38,83],"automatic":[40],"speech":[41],"recognition":[42],"(ASR).In":[43],"variant,":[45],"assume":[47],"existence":[49],"well-trained":[52,127],"model":[54],"use":[56],"it":[57,86],"an":[59,77],"anchor":[60,82,99],"in":[61,70],"parent":[63],"population":[64,93],"whose":[65],"good":[66],"\"gene\"":[67],"will":[68,94],"propagate":[69],"evolution":[72],"to":[73],"offsprings.We":[75],"propose":[76],"algorithm":[79],"leveraging":[80],"such":[84],"guarantees":[87],"best":[89],"fitness":[90],"never":[95],"degrade":[96],"from":[97],"model.Experiments":[100],"on":[101],"50-hour":[102],"Broadcast":[103],"News":[104],"(BN50)":[105],"300-hour":[107],"Switchboard":[108],"(SWB300)":[109],"show":[110],"with":[114],"anchors":[115],"can":[116],"further":[117],"improve":[118],"loss":[120],"ASR":[122],"performance":[123],"over":[124],"existing":[126],"models.":[129]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
