{"id":"https://openalex.org/W4385938132","doi":"https://doi.org/10.1109/access.2023.3306026","title":"Application of Split Residual Multilevel Attention Network in Speaker Recognition","display_name":"Application of Split Residual Multilevel Attention Network in Speaker Recognition","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4385938132","doi":"https://doi.org/10.1109/access.2023.3306026"},"language":"en","primary_location":{"id":"doi:10.1109/access.2023.3306026","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3306026","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10223220.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10223220.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081733792","display_name":"Jiji Wang","orcid":"https://orcid.org/0009-0006-5833-0266"},"institutions":[{"id":"https://openalex.org/I31595395","display_name":"Chengdu University of Technology","ror":"https://ror.org/05pejbw21","country_code":"CN","type":"education","lineage":["https://openalex.org/I31595395"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiji Wang","raw_affiliation_strings":["College of Computer Science and Cyber Security, Chengdu University of Technology, Chengdu, China"],"raw_orcid":"https://orcid.org/0009-0006-5833-0266","affiliations":[{"raw_affiliation_string":"College of Computer Science and Cyber Security, Chengdu University of Technology, Chengdu, China","institution_ids":["https://openalex.org/I31595395"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103187741","display_name":"Fei Deng","orcid":"https://orcid.org/0000-0002-2218-0853"},"institutions":[{"id":"https://openalex.org/I31595395","display_name":"Chengdu University of Technology","ror":"https://ror.org/05pejbw21","country_code":"CN","type":"education","lineage":["https://openalex.org/I31595395"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Deng","raw_affiliation_strings":["College of Computer Science and Cyber Security, Chengdu University of Technology, Chengdu, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Cyber Security, Chengdu University of Technology, Chengdu, China","institution_ids":["https://openalex.org/I31595395"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064646267","display_name":"Lihong Deng","orcid":"https://orcid.org/0000-0002-2090-7158"},"institutions":[{"id":"https://openalex.org/I31595395","display_name":"Chengdu University of Technology","ror":"https://ror.org/05pejbw21","country_code":"CN","type":"education","lineage":["https://openalex.org/I31595395"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lihong Deng","raw_affiliation_strings":["College of Computer Science and Cyber Security, Chengdu University of Technology, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-2090-7158","affiliations":[{"raw_affiliation_string":"College of Computer Science and Cyber Security, Chengdu University of Technology, Chengdu, China","institution_ids":["https://openalex.org/I31595395"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101168953","display_name":"Ping Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ping Gao","raw_affiliation_strings":["Sichuan Tianyi Ecological Garden Group Company Ltd., Chengdu, China","Sichuan Tianyi Ecological Garden Group Co., LTD., No.1 Keyuan South Road, High-tech Zone, Chengdu City, Sichuan Province, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sichuan Tianyi Ecological Garden Group Company Ltd., Chengdu, China","institution_ids":[]},{"raw_affiliation_string":"Sichuan Tianyi Ecological Garden Group Co., LTD., No.1 Keyuan South Road, High-tech Zone, Chengdu City, Sichuan Province, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103248376","display_name":"Yuanxiang Huang","orcid":"https://orcid.org/0009-0000-8123-7269"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuanxiang Huang","raw_affiliation_strings":["Sichuan Tianyi Ecological Garden Group Company Ltd., Chengdu, China","Sichuan Tianyi Ecological Garden Group Co., LTD., No.1 Keyuan South Road, High-tech Zone, Chengdu City, Sichuan Province, China"],"raw_orcid":"https://orcid.org/0009-0000-8123-7269","affiliations":[{"raw_affiliation_string":"Sichuan Tianyi Ecological Garden Group Company Ltd., Chengdu, China","institution_ids":[]},{"raw_affiliation_string":"Sichuan Tianyi Ecological Garden Group Co., LTD., No.1 Keyuan South Road, High-tech Zone, Chengdu City, Sichuan Province, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5081733792"],"corresponding_institution_ids":["https://openalex.org/I31595395"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.5055,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.71241751,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"11","issue":null,"first_page":"89359","last_page":"89368"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8285413980484009},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.7933356761932373},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6719685792922974},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.627006471157074},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5714303255081177},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5495877265930176},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.5450965166091919},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5334152579307556},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.5253835916519165},{"id":"https://openalex.org/keywords/residual-neural-network","display_name":"Residual neural network","score":0.47099918127059937},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46656739711761475},{"id":"https://openalex.org/keywords/test-set","display_name":"Test set","score":0.43812209367752075},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.43044358491897583},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2838839590549469},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.08941909670829773}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8285413980484009},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.7933356761932373},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6719685792922974},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.627006471157074},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5714303255081177},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5495877265930176},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.5450965166091919},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5334152579307556},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.5253835916519165},{"id":"https://openalex.org/C2944601119","wikidata":"https://www.wikidata.org/wiki/Q43744058","display_name":"Residual neural network","level":3,"score":0.47099918127059937},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46656739711761475},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.43812209367752075},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.43044358491897583},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2838839590549469},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.08941909670829773},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2023.3306026","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3306026","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10223220.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:8494073d9a5041298329d8792f6bb69e","is_oa":true,"landing_page_url":"https://doaj.org/article/8494073d9a5041298329d8792f6bb69e","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 11, Pp 89359-89368 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2023.3306026","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3306026","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10223220.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6600000262260437,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385938132.pdf","grobid_xml":"https://content.openalex.org/works/W4385938132.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W86526702","https://openalex.org/W1522301498","https://openalex.org/W2046056978","https://openalex.org/W2101261946","https://openalex.org/W2194775991","https://openalex.org/W2408021097","https://openalex.org/W2612434969","https://openalex.org/W2726515241","https://openalex.org/W2748488820","https://openalex.org/W2784163702","https://openalex.org/W2794506738","https://openalex.org/W2808631503","https://openalex.org/W2884585870","https://openalex.org/W2890354241","https://openalex.org/W2890964092","https://openalex.org/W2916104401","https://openalex.org/W2928165649","https://openalex.org/W2963420686","https://openalex.org/W2972552635","https://openalex.org/W2981087920","https://openalex.org/W3015261361","https://openalex.org/W3024869864","https://openalex.org/W3103152812","https://openalex.org/W3108091009","https://openalex.org/W3118639295","https://openalex.org/W3197940657","https://openalex.org/W3198698812","https://openalex.org/W3206114047","https://openalex.org/W4220884846","https://openalex.org/W4225789456","https://openalex.org/W4288091954","https://openalex.org/W6631190155","https://openalex.org/W6687442591","https://openalex.org/W6737575990","https://openalex.org/W6753412334","https://openalex.org/W6769178842","https://openalex.org/W6797356783","https://openalex.org/W6801723603"],"related_works":["https://openalex.org/W4384929466","https://openalex.org/W2206035908","https://openalex.org/W3148366653","https://openalex.org/W2162158162","https://openalex.org/W4247736853","https://openalex.org/W1493012537","https://openalex.org/W2175373321","https://openalex.org/W2125642021","https://openalex.org/W4310979479","https://openalex.org/W2696990509"],"abstract_inverted_index":{"Current":[0],"speaker":[1,27,132,144,158,187,192],"recognition":[2,133,145,159,188],"systems":[3,146],"are":[4,19],"mainly":[5],"for":[6,56],"the":[7,37,113,122,131,148,157],"combined":[8],"application":[9],"of":[10,26,39,45,64,76,138],"network":[11,54],"architectures":[12],"and":[13,30,32,42,83,87,104,115,118,124,140,169,179,197],"attention":[14,98],"mechanisms,":[15],"however,":[16],"lightweight":[17],"networks":[18,34],"not":[20],"able":[21],"to":[22],"extract":[23],"frame-level":[24],"features":[25,103,107,111],"speech":[28],"well,":[29],"deeper":[31],"wider":[33],"also":[35],"face":[36],"problems":[38],"slower":[40],"inference":[41],"excessive":[43],"number":[44],"parameters.":[46],"To":[47],"this":[48,163],"end,":[49],"we":[50,93],"proposes":[51],"Split-ResNet,":[52],"a":[53,62,69,74,95,136,186],"structure":[55],"split":[57],"residuals,":[58],"which":[59],"can":[60],"obtain":[61],"combination":[63,137],"multiple":[65],"receptive":[66],"field":[67],"at":[68],"finer-grained":[70],"level,":[71],"thus":[72],"obtaining":[73],"variety":[75],"feature":[77,194],"representations":[78],"with":[79,175,190],"different":[80],"scale":[81],"combinations":[82],"producing":[84],"more":[85],"informative":[86],"comprehensive":[88],"multi-scale":[89],"features.":[90],"In":[91],"addition":[92],"propose":[94],"dual":[96],"time-frequency":[97],"(DTFA)":[99],"that":[100,156,183],"enhances":[101],"key":[102],"suppresses":[105],"unimportant":[106],"by":[108],"focusing":[109],"on":[110,147],"in":[112,162,172],"time":[114,123],"frequency":[116,125],"domains":[117],"learning":[119],"weights":[120],"from":[121],"channels,":[126],"respectively.":[127],"We":[128],"finally":[129],"tested":[130],"system":[134,160,189],"using":[135],"Split-ResNet":[139],"DTFA":[141],"against":[142],"other":[143],"Voxceleb1-O":[149],"test":[150,153],"set.":[151],"The":[152],"results":[154],"show":[155],"proposed":[161],"paper":[164],"is":[165,185],"0.98%,":[166],"0.39%,":[167],"0.69%":[168],"0.47%":[170],"lower":[171],"EER":[173],"compared":[174],"SpeechNAS,":[176],"RawNet2,":[177],"Y-vector":[178],"CNN+Transformer,":[180],"respectively,":[181],"proving":[182],"DTFA+Split-ResNet":[184],"good":[191],"audio":[193],"extraction":[195],"capability":[196],"discriminative":[198],"capability.":[199]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
