{"id":"https://openalex.org/W2786839803","doi":"https://doi.org/10.1109/asru.2017.8268987","title":"Exploring ASR-free end-to-end modeling to improve spoken language understanding in a cloud-based dialog system","display_name":"Exploring ASR-free end-to-end modeling to improve spoken language understanding in a cloud-based dialog system","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2786839803","doi":"https://doi.org/10.1109/asru.2017.8268987","mag":"2786839803"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2017.8268987","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2017.8268987","pdf_url":null,"source":{"id":"https://openalex.org/S4306498158","display_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100342006","display_name":"Yao Qian","orcid":"https://orcid.org/0000-0003-1855-9630"},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yao Qian","raw_affiliation_strings":["Educational Testing Service Research, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service Research, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030738204","display_name":"Rutuja Ubale","orcid":null},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rutuja Ubale","raw_affiliation_strings":["Educational Testing Service Research, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service Research, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043115328","display_name":"Vikram Ramanaryanan","orcid":null},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vikram Ramanaryanan","raw_affiliation_strings":["Educational Testing Service Research, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service Research, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029778136","display_name":"Patrick Lange","orcid":"https://orcid.org/0000-0003-3935-663X"},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Patrick Lange","raw_affiliation_strings":["Educational Testing Service Research, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service Research, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008930900","display_name":"David Suendermann\u2010Oeft","orcid":null},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Suendermann-Oeft","raw_affiliation_strings":["Educational Testing Service Research, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service Research, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030816616","display_name":"Keelan Evanini","orcid":"https://orcid.org/0000-0003-4243-3376"},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Keelan Evanini","raw_affiliation_strings":["Educational Testing Service Research, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service Research, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030778828","display_name":"Eugene Tsuprun","orcid":null},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eugene Tsuprun","raw_affiliation_strings":["Educational Testing Service Research, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service Research, USA","institution_ids":["https://openalex.org/I1341030882"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100342006"],"corresponding_institution_ids":["https://openalex.org/I1341030882"],"apc_list":null,"apc_paid":null,"fwci":5.4605,"has_fulltext":false,"cited_by_count":63,"citation_normalized_percentile":{"value":0.96633249,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"569","last_page":"576"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8911277055740356},{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.8341733813285828},{"id":"https://openalex.org/keywords/dialog-system","display_name":"Dialog system","score":0.7435089349746704},{"id":"https://openalex.org/keywords/spoken-language","display_name":"Spoken language","score":0.6841856837272644},{"id":"https://openalex.org/keywords/natural-language-understanding","display_name":"Natural language understanding","score":0.6047824025154114},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5633922815322876},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5241944193840027},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49609169363975525},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4926827549934387},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.4836669862270355},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4777066707611084},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.4320400059223175},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.12740889191627502},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.11678680777549744}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8911277055740356},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.8341733813285828},{"id":"https://openalex.org/C190954187","wikidata":"https://www.wikidata.org/wiki/Q5270587","display_name":"Dialog system","level":3,"score":0.7435089349746704},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.6841856837272644},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.6047824025154114},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5633922815322876},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5241944193840027},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49609169363975525},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4926827549934387},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.4836669862270355},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4777066707611084},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.4320400059223175},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.12740889191627502},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.11678680777549744},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru.2017.8268987","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2017.8268987","pdf_url":null,"source":{"id":"https://openalex.org/S4306498158","display_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8199999928474426}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W39511165","https://openalex.org/W97072897","https://openalex.org/W149113674","https://openalex.org/W217970951","https://openalex.org/W1032614754","https://openalex.org/W1505640990","https://openalex.org/W1524333225","https://openalex.org/W1806039879","https://openalex.org/W1936920915","https://openalex.org/W2049759087","https://openalex.org/W2064675550","https://openalex.org/W2093973850","https://openalex.org/W2094472029","https://openalex.org/W2099877156","https://openalex.org/W2102113734","https://openalex.org/W2114925438","https://openalex.org/W2117520332","https://openalex.org/W2118620946","https://openalex.org/W2123379364","https://openalex.org/W2132037657","https://openalex.org/W2137871902","https://openalex.org/W2138857742","https://openalex.org/W2140279531","https://openalex.org/W2153501885","https://openalex.org/W2155524666","https://openalex.org/W2160306971","https://openalex.org/W2160815625","https://openalex.org/W2161466446","https://openalex.org/W2163922914","https://openalex.org/W2250974548","https://openalex.org/W2399456070","https://openalex.org/W2399733683","https://openalex.org/W2399855989","https://openalex.org/W2400092632","https://openalex.org/W2402146185","https://openalex.org/W2510063686","https://openalex.org/W2515090196","https://openalex.org/W2550112318","https://openalex.org/W2962826786","https://openalex.org/W2963211739","https://openalex.org/W2963311389","https://openalex.org/W2963571336","https://openalex.org/W4236521339","https://openalex.org/W6603931906","https://openalex.org/W6606067871","https://openalex.org/W6608710415","https://openalex.org/W6630235389","https://openalex.org/W6631362777","https://openalex.org/W6640440542","https://openalex.org/W6674796821","https://openalex.org/W6675365184","https://openalex.org/W6680300913","https://openalex.org/W6680672469","https://openalex.org/W6712742799","https://openalex.org/W6712930963"],"related_works":["https://openalex.org/W48079147","https://openalex.org/W2394821827","https://openalex.org/W326836678","https://openalex.org/W2563921006","https://openalex.org/W1963944933","https://openalex.org/W2111550420","https://openalex.org/W1977846844","https://openalex.org/W2166986207","https://openalex.org/W4230258867","https://openalex.org/W2786839803"],"abstract_inverted_index":{"Spoken":[0],"language":[1,13,114],"understanding":[2,14],"(SLU)":[3],"in":[4,39,126],"dialog":[5,33,92],"systems":[6],"is":[7,123,162],"generally":[8],"performed":[9],"using":[10],"a":[11,64,88,112,139],"natural":[12],"(NLU)":[15],"model":[16],"based":[17],"on":[18,102],"the":[19,58,67,97,136,151,157],"hypotheses":[20,148],"produced":[21],"by":[22,149],"an":[23,79],"automatic":[24],"speech":[25],"recognition":[26],"(ASR)":[27],"system.":[28],"However,":[29],"when":[30],"new":[31],"spoken":[32,91],"applications":[34],"are":[35],"built":[36],"from":[37,106,153,164],"scratch":[38],"real":[40],"user":[41],"environments":[42],"that":[43,120],"often":[44],"have":[45],"sub-optimal":[46],"audio":[47],"characteristics,":[48],"ASR":[49,130,147],"performance":[50,137],"can":[51,133],"suffer":[52],"due":[53],"to":[54,85,166],"factors":[55],"such":[56],"as":[57],"paucity":[59],"of":[60,99,138,160],"training":[61,68],"data":[62,104],"or":[63],"mismatch":[65],"between":[66],"and":[69],"test":[70],"data.":[71],"To":[72],"address":[73],"this":[74,76],"issue,":[75],"paper":[77],"proposes":[78],"ASR-free,":[80],"end-to-end":[81],"(E2E)":[82],"modeling":[83],"approach":[84,101,122],"SLU":[86,142,161],"for":[87],"cloud-based,":[89],"modular":[90],"system":[93,143],"(SDS).":[94],"We":[95],"evaluate":[96],"effectiveness":[98],"our":[100,121],"crowdsourced":[103],"collected":[105],"non-native":[107],"English":[108],"speakers":[109],"interacting":[110],"with":[111,128,144],"conversational":[113],"learning":[115],"application.":[116],"Experimental":[117],"results":[118],"show":[119],"particularly":[124],"promising":[125],"situations":[127],"low":[129],"accuracy.":[131],"It":[132],"further":[134],"improve":[135],"sophisticated":[140],"CNN-based":[141],"more":[145],"accurate":[146],"fusing":[150],"scores":[152],"E2E":[154],"system,":[155],"i.e.,":[156],"overall":[158],"accuracy":[159],"improved":[163],"85.6%":[165],"86.5%.":[167]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":23},{"year":2020,"cited_by_count":19},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
