{"id":"https://openalex.org/W2793012778","doi":"https://doi.org/10.1109/taslp.2018.2797420","title":"Language/Dialect Recognition Based on Unsupervised Deep Learning","display_name":"Language/Dialect Recognition Based on Unsupervised Deep Learning","publication_year":2018,"publication_date":"2018-01-24","ids":{"openalex":"https://openalex.org/W2793012778","doi":"https://doi.org/10.1109/taslp.2018.2797420","mag":"2793012778"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2018.2797420","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2797420","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115603610","display_name":"Qian Zhang","orcid":"https://orcid.org/0000-0001-5975-9781"},"institutions":[{"id":"https://openalex.org/I162577319","display_name":"The University of Texas at Dallas","ror":"https://ror.org/049emcs32","country_code":"US","type":"education","lineage":["https://openalex.org/I162577319"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Qian Zhang","raw_affiliation_strings":["Center for Robust Speech Systems, Erik Jonsson School of Engineering University of Texas at Dallas, Richardson, TX, USA"],"affiliations":[{"raw_affiliation_string":"Center for Robust Speech Systems, Erik Jonsson School of Engineering University of Texas at Dallas, Richardson, TX, USA","institution_ids":["https://openalex.org/I162577319"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057910370","display_name":"John H. L. Hansen","orcid":"https://orcid.org/0000-0003-1382-9929"},"institutions":[{"id":"https://openalex.org/I162577319","display_name":"The University of Texas at Dallas","ror":"https://ror.org/049emcs32","country_code":"US","type":"education","lineage":["https://openalex.org/I162577319"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"John H. L. Hansen","raw_affiliation_strings":["Center for Robust Speech Systems, Erik Jonsson School of Engineering University of Texas at Dallas, Richardson, TX, USA"],"affiliations":[{"raw_affiliation_string":"Center for Robust Speech Systems, Erik Jonsson School of Engineering University of Texas at Dallas, Richardson, TX, USA","institution_ids":["https://openalex.org/I162577319"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5115603610"],"corresponding_institution_ids":["https://openalex.org/I162577319"],"apc_list":null,"apc_paid":null,"fwci":4.7236,"has_fulltext":false,"cited_by_count":41,"citation_normalized_percentile":{"value":0.95839435,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"26","issue":"5","first_page":"873","last_page":"882"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.8907632827758789},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7636628150939941},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7532905340194702},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7080256938934326},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.603699803352356},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5780476331710815},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5401498079299927},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4606840908527374},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.41466018557548523},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.40276187658309937},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.387633740901947},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.0872284471988678}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.8907632827758789},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7636628150939941},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7532905340194702},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7080256938934326},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.603699803352356},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5780476331710815},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5401498079299927},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4606840908527374},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.41466018557548523},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.40276187658309937},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.387633740901947},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0872284471988678},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2018.2797420","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2018.2797420","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7900000214576721,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G8087301405","display_name":null,"funder_award_id":"FA8750-15-1-0205","funder_id":"https://openalex.org/F4320338294","funder_display_name":"Air Force Research Laboratory"}],"funders":[{"id":"https://openalex.org/F4320338294","display_name":"Air Force Research Laboratory","ror":"https://ror.org/02e2egq70"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1499798934","https://openalex.org/W1524333225","https://openalex.org/W1936725236","https://openalex.org/W1968377371","https://openalex.org/W1990501283","https://openalex.org/W2001285277","https://openalex.org/W2011142564","https://openalex.org/W2023582935","https://openalex.org/W2025929295","https://openalex.org/W2034626437","https://openalex.org/W2039057510","https://openalex.org/W2046015436","https://openalex.org/W2095501777","https://openalex.org/W2107638917","https://openalex.org/W2113832997","https://openalex.org/W2128952115","https://openalex.org/W2131703294","https://openalex.org/W2134817403","https://openalex.org/W2147768505","https://openalex.org/W2151534428","https://openalex.org/W2158069733","https://openalex.org/W2183016404","https://openalex.org/W2184170932","https://openalex.org/W2185814970","https://openalex.org/W2187089797","https://openalex.org/W2296483664","https://openalex.org/W2340176088","https://openalex.org/W2398046886","https://openalex.org/W2406718879","https://openalex.org/W2408548175","https://openalex.org/W2505434962","https://openalex.org/W2509153213","https://openalex.org/W2963486098","https://openalex.org/W4234330420","https://openalex.org/W4293568373","https://openalex.org/W4361745846","https://openalex.org/W6606123296","https://openalex.org/W6629687487","https://openalex.org/W6631362777","https://openalex.org/W6680125536","https://openalex.org/W6686429374","https://openalex.org/W6691580672","https://openalex.org/W6697003656","https://openalex.org/W6780248173"],"related_works":["https://openalex.org/W2595172197","https://openalex.org/W3013693939","https://openalex.org/W2566616303","https://openalex.org/W2159052453","https://openalex.org/W3131327266","https://openalex.org/W2669956259","https://openalex.org/W4249005693","https://openalex.org/W4392946183","https://openalex.org/W3088732000","https://openalex.org/W3013299381"],"abstract_inverted_index":{"Over":[0],"the":[1,57,113,116,162,180],"past":[2],"decade,":[3],"bottleneck":[4,20,47,59],"features":[5,147,164],"within":[6],"an":[7,45],"i-Vector":[8],"framework":[9],"have":[10,89],"been":[11,90],"used":[12],"for":[13,84,93,142,177],"state-of-the-art":[14],"language/dialect":[15],"identification":[16],"(LID/DID).":[17],"However,":[18],"traditional":[19,58,152],"feature":[21,48,86,154],"extraction":[22,49],"requires":[23],"additional":[24],"transcribed":[25],"speech":[26,85,109,185],"information.":[27],"Alternatively,":[28],"two":[29,75],"types":[30,76],"of":[31,77,108,115,182],"unsupervised":[32,46],"deep":[33],"learning":[34,80],"methods":[35],"are":[36,82,103,121,148],"introduced":[37,83],"in":[38,172],"this":[39,43],"study.":[40],"To":[41,111],"address":[42],"limitation,":[44],"approach":[50],"is":[51,54],"proposed,":[52],"which":[53,88],"derived":[55],"from":[56],"structure":[60],"but":[61],"trained":[62],"with":[63],"estimated":[64],"phonetic":[65],"labels.":[66],"In":[67],"addition,":[68],"based":[69],"on":[70,105],"a":[71,97,124,130,168],"generative":[72],"modeling":[73],"autoencoder,":[74],"latent":[78],"variable":[79],"algorithms":[81],"processing,":[87],"previous":[91],"considered":[92],"image":[94],"processing/reconstruction.":[95],"Specifically,":[96],"variational":[98],"autoencoder":[99,102],"and":[100,135],"adversarial":[101],"utilized":[104],"alternative":[106],"phase":[107],"processing.":[110],"demonstrate":[112],"effectiveness":[114],"proposed":[117,146,163],"methods,":[118],"three":[119,158],"corpora":[120],"evaluated:":[122],"1)":[123],"four":[125],"Chinese":[126],"dialect":[127,133],"dataset,":[128],"2)":[129],"five":[131],"Arabic":[132],"corpus,":[134],"3)":[136],"multigenre":[137],"broadcast":[138],"challenge":[139],"corpus":[140],"(MGB-3)":[141],"arabic":[143],"DID.":[144],"The":[145],"shown":[149],"to":[150,167],"outperform":[151],"acoustic":[153],"MFCCs":[155],"consistently":[156],"across":[157],"corpora.":[159,186],"Taken":[160],"collectively,":[161],"achieve":[165],"up":[166],"relative":[169],"+58%":[170],"improvement":[171],"C":[173],"<sub":[174],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[175],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">avg</sub>":[176],"LID/DID":[178],"without":[179],"need":[181],"any":[183],"secondary":[184]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":13},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
