{"id":"https://openalex.org/W3042558177","doi":"https://doi.org/10.1109/access.2020.3009987","title":"Speaker Identification in Multi-Talker Overlapping Speech Using Neural Networks","display_name":"Speaker Identification in Multi-Talker Overlapping Speech Using Neural Networks","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3042558177","doi":"https://doi.org/10.1109/access.2020.3009987","mag":"3042558177"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3009987","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3009987","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09143073.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09143073.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010107824","display_name":"Van-Thuan Tran","orcid":"https://orcid.org/0000-0002-3197-679X"},"institutions":[{"id":"https://openalex.org/I118292597","display_name":"National Taipei University of Technology","ror":"https://ror.org/00cn92c09","country_code":"TW","type":"education","lineage":["https://openalex.org/I118292597"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Van-Thuan Tran","raw_affiliation_strings":["Department of Electronic Engineering, National Taipei University of Technology, Taipei, Taiwan"],"raw_orcid":"https://orcid.org/0000-0002-3197-679X","affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, National Taipei University of Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I118292597"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020303183","display_name":"Wei-Ho Tsai","orcid":"https://orcid.org/0000-0002-0867-7951"},"institutions":[{"id":"https://openalex.org/I118292597","display_name":"National Taipei University of Technology","ror":"https://ror.org/00cn92c09","country_code":"TW","type":"education","lineage":["https://openalex.org/I118292597"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Wei-Ho Tsai","raw_affiliation_strings":["Department of Electronic Engineering, National Taipei University of Technology, Taipei, Taiwan"],"raw_orcid":"https://orcid.org/0000-0002-0867-7951","affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering, National Taipei University of Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I118292597"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5010107824"],"corresponding_institution_ids":["https://openalex.org/I118292597"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.544,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.735162,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"8","issue":null,"first_page":"134868","last_page":"134879"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8131314516067505},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7289878129959106},{"id":"https://openalex.org/keywords/speaker-identification","display_name":"Speaker identification","score":0.7127752304077148},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5800324082374573},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.566070556640625},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5640829801559448},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5521324872970581},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5319196581840515},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5095577239990234},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4976373016834259},{"id":"https://openalex.org/keywords/single-stage","display_name":"Single stage","score":0.4740331470966339},{"id":"https://openalex.org/keywords/multilayer-perceptron","display_name":"Multilayer perceptron","score":0.4331216812133789},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4309220016002655},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.4292443096637726},{"id":"https://openalex.org/keywords/perceptron","display_name":"Perceptron","score":0.42704713344573975}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8131314516067505},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7289878129959106},{"id":"https://openalex.org/C2986627078","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker identification","level":3,"score":0.7127752304077148},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5800324082374573},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.566070556640625},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5640829801559448},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5521324872970581},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5319196581840515},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5095577239990234},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4976373016834259},{"id":"https://openalex.org/C3020376581","wikidata":"https://www.wikidata.org/wiki/Q16866784","display_name":"Single stage","level":2,"score":0.4740331470966339},{"id":"https://openalex.org/C179717631","wikidata":"https://www.wikidata.org/wiki/Q2991667","display_name":"Multilayer perceptron","level":3,"score":0.4331216812133789},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4309220016002655},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.4292443096637726},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.42704713344573975},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.3009987","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3009987","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09143073.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:2db1bbf963904497866472b1a4a22c84","is_oa":true,"landing_page_url":"https://doaj.org/article/2db1bbf963904497866472b1a4a22c84","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 134868-134879 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3009987","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3009987","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09143073.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.41999998688697815,"display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G1192399272","display_name":null,"funder_award_id":"MOST 106-","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G1662538391","display_name":null,"funder_award_id":"2221-E-027","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G4905506096","display_name":null,"funder_award_id":"106-2221-E-027-125-MY2","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G5563719332","display_name":null,"funder_award_id":"106-2221-E-","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G8622225470","display_name":null,"funder_award_id":"MOST 106-2221-E-027-125-MY2","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"},{"id":"https://openalex.org/G939887807","display_name":null,"funder_award_id":"MOST 106","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"}],"funders":[{"id":"https://openalex.org/F4320322795","display_name":"Ministry of Science and Technology, Taiwan","ror":"https://ror.org/02kv4zf79"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3042558177.pdf","grobid_xml":"https://content.openalex.org/works/W3042558177.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W32904849","https://openalex.org/W80245499","https://openalex.org/W603591469","https://openalex.org/W814827736","https://openalex.org/W1006777433","https://openalex.org/W1558276682","https://openalex.org/W2003522884","https://openalex.org/W2046056978","https://openalex.org/W2097583714","https://openalex.org/W2106103082","https://openalex.org/W2115483887","https://openalex.org/W2146502635","https://openalex.org/W2163704482","https://openalex.org/W2169264834","https://openalex.org/W2191779130","https://openalex.org/W2577680292","https://openalex.org/W2726515241","https://openalex.org/W2767537758","https://openalex.org/W2890964092","https://openalex.org/W2915280872","https://openalex.org/W2964052309","https://openalex.org/W2972627751","https://openalex.org/W2983799728","https://openalex.org/W6601320802","https://openalex.org/W6603318777","https://openalex.org/W6618327443","https://openalex.org/W6675718704","https://openalex.org/W6681435938"],"related_works":["https://openalex.org/W2128073728","https://openalex.org/W4234190324","https://openalex.org/W1197719229","https://openalex.org/W2381158726","https://openalex.org/W1992796048","https://openalex.org/W4396668120","https://openalex.org/W2126085626","https://openalex.org/W2129048388","https://openalex.org/W2129090883","https://openalex.org/W2972577568"],"abstract_inverted_index":{"Although":[0],"numerous":[1],"works":[2,16],"have":[3],"studied":[4],"the":[5,18,28,54,65,84,92,101,121,128,139,145,158,181,205],"problem":[6],"of":[7,25,30,94,138,210],"automatic":[8],"speaker":[9],"identification":[10,134],"(SID),":[11],"there":[12],"are":[13],"only":[14],"few":[15],"on":[17,149,161],"SID":[19,58],"for":[20,56,180],"overlapping":[21,38,57,66,202],"speech,":[22],"and":[23,83,165,200],"none":[24],"them":[26],"consider":[27],"case":[29],"more":[31,117,192],"than":[32,120,136,157],"two":[33,76],"simultaneous":[34,72,95,189],"speakers.":[35,73,190],"Recognizing":[36],"that":[37,60,127,137],"speech":[39,67],"occurs":[40],"frequently":[41],"in":[42,47,64],"real-life":[43],"scenarios,":[44],"such":[45],"as":[46],"meetings":[48],"or":[49],"debates,":[50],"this":[51],"work":[52],"investigates":[53],"methods":[55],"(OSID)":[59],"can":[61],"determine":[62],"identities":[63],"from":[68],"up":[69,186],"to":[70,110,187],"five":[71,188],"We":[74],"propose":[75],"deep-learning":[77],"OSID":[78,112,130,146,174,178],"systems,":[79],"one":[80],"is":[81,86,115],"two-stage":[82,89,122,129,173],"other":[85],"single-stage.":[87],"The":[88,103,170],"system":[90,105,131,175,206],"determines":[91],"number":[93],"speakers":[96],"firstly,":[97],"followed":[98],"by":[99],"identifying":[100],"speaker(s).":[102],"single-stage":[104,140],"uses":[106],"a":[107],"single":[108],"classifier":[109],"perform":[111,155],"directly,":[113],"which":[114],"slightly":[116],"computationally":[118],"efficient":[119],"system.":[123,141],"Our":[124],"experiments":[125],"show":[126],"achieves":[132,176],"better":[133,156],"accuracy":[135,179],"In":[142,191],"addition,":[143],"both":[144,197],"systems":[147,159],"based":[148,160],"one-dimensional":[150],"convolutional":[151],"neural":[152],"networks":[153],"(1DCNN)":[154],"multilayer":[162],"perceptron":[163],"(MLP)":[164],"Gaussian":[166],"mixture":[167],"models":[168],"(GMMs).":[169],"proposed":[171],"1DCNN-based":[172],"98.55%":[177],"clean":[182],"audio":[183],"data":[184],"containing":[185],"challenging":[193],"experimental":[194],"conditions":[195],"involving":[196],"background":[198],"noises":[199],"high":[201],"energy":[203],"ratios,":[204],"still":[207],"attained":[208],"accuracies":[209],"above":[211],"90%.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
