{"id":"https://openalex.org/W3021717829","doi":"https://doi.org/10.1109/taslp.2020.2990275","title":"Speaker Verification by Partial AUC Optimization With Mahalanobis Distance Metric Learning","display_name":"Speaker Verification by Partial AUC Optimization With Mahalanobis Distance Metric Learning","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3021717829","doi":"https://doi.org/10.1109/taslp.2020.2990275","mag":"3021717829"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2020.2990275","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2020.2990275","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041350492","display_name":"Zhongxin Bai","orcid":"https://orcid.org/0000-0003-3575-7014"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhongxin Bai","raw_affiliation_strings":["Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi\u2019an, China","Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi\u2019an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi'an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100450091","display_name":"Xiao-Lei Zhang","orcid":"https://orcid.org/0000-0001-7694-193X"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao-Lei Zhang","raw_affiliation_strings":["Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi\u2019an, China","Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi\u2019an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Center of Intelligent Acoustics and Immersive Communications (CIAIC) and the School of Marine Science and Technology, Northwestern Polytechnical University, Xi'an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056129529","display_name":"Jingdong Chen","orcid":"https://orcid.org/0000-0003-0083-9247"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingdong Chen","raw_affiliation_strings":["CIAIC, Northwestern Polytechnical University, Xi\u2019an, China","CIAIC, Northwestern Polytechnical University, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"CIAIC, Northwestern Polytechnical University, Xi\u2019an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"CIAIC, Northwestern Polytechnical University, Xi'an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5041350492"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":1.9205,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.88730668,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"28","issue":null,"first_page":"1533","last_page":"1548"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mahalanobis-distance","display_name":"Mahalanobis distance","score":0.8369600772857666},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.6782382726669312},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.665250837802887},{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.5830967426300049},{"id":"https://openalex.org/keywords/receiver-operating-characteristic","display_name":"Receiver operating characteristic","score":0.5827102065086365},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5805137157440186},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5613885521888733},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.4985966682434082},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.49372372031211853},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4774644672870636},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.4362347722053528},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.354219913482666},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.33710378408432007},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.30858343839645386},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.25592148303985596},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.17577162384986877}],"concepts":[{"id":"https://openalex.org/C1921717","wikidata":"https://www.wikidata.org/wiki/Q1334846","display_name":"Mahalanobis distance","level":2,"score":0.8369600772857666},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.6782382726669312},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.665250837802887},{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.5830967426300049},{"id":"https://openalex.org/C58471807","wikidata":"https://www.wikidata.org/wiki/Q327120","display_name":"Receiver operating characteristic","level":2,"score":0.5827102065086365},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5805137157440186},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5613885521888733},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.4985966682434082},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.49372372031211853},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4774644672870636},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.4362347722053528},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.354219913482666},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33710378408432007},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.30858343839645386},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25592148303985596},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.17577162384986877},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2020.2990275","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2020.2990275","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5799999833106995,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G5133417063","display_name":null,"funder_award_id":"2018AAA0102200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":66,"referenced_works":["https://openalex.org/W1524333225","https://openalex.org/W1586405805","https://openalex.org/W1589137271","https://openalex.org/W1916834241","https://openalex.org/W1971758513","https://openalex.org/W2023238506","https://openalex.org/W2039057510","https://openalex.org/W2041823554","https://openalex.org/W2046056978","https://openalex.org/W2068042582","https://openalex.org/W2078169166","https://openalex.org/W2085668081","https://openalex.org/W2106053110","https://openalex.org/W2114925438","https://openalex.org/W2121949863","https://openalex.org/W2123768812","https://openalex.org/W2137310491","https://openalex.org/W2150769028","https://openalex.org/W2167136086","https://openalex.org/W2169495281","https://openalex.org/W2170088868","https://openalex.org/W2183016404","https://openalex.org/W2268629890","https://openalex.org/W2294814385","https://openalex.org/W2395750323","https://openalex.org/W2406312423","https://openalex.org/W2513304932","https://openalex.org/W2516764878","https://openalex.org/W2584329820","https://openalex.org/W2587150483","https://openalex.org/W2592513362","https://openalex.org/W2726515241","https://openalex.org/W2728421214","https://openalex.org/W2748488820","https://openalex.org/W2781787017","https://openalex.org/W2783693219","https://openalex.org/W2786386907","https://openalex.org/W2790091699","https://openalex.org/W2794506738","https://openalex.org/W2802488037","https://openalex.org/W2802973008","https://openalex.org/W2808631503","https://openalex.org/W2888897023","https://openalex.org/W2889016587","https://openalex.org/W2889045432","https://openalex.org/W2889050834","https://openalex.org/W2889385246","https://openalex.org/W2889519245","https://openalex.org/W2890250568","https://openalex.org/W2890964092","https://openalex.org/W2953271441","https://openalex.org/W2962714336","https://openalex.org/W2962832278","https://openalex.org/W2963026686","https://openalex.org/W2963775347","https://openalex.org/W3006478128","https://openalex.org/W3123535731","https://openalex.org/W3141593045","https://openalex.org/W4210880854","https://openalex.org/W6631362777","https://openalex.org/W6640010188","https://openalex.org/W6675751002","https://openalex.org/W6680117457","https://openalex.org/W6686491854","https://openalex.org/W6713727690","https://openalex.org/W6759166234"],"related_works":["https://openalex.org/W1968216131","https://openalex.org/W2355011896","https://openalex.org/W3089964815","https://openalex.org/W1581134722","https://openalex.org/W2051274299","https://openalex.org/W2169890399","https://openalex.org/W2170952763","https://openalex.org/W2359348847","https://openalex.org/W468945283","https://openalex.org/W2148960477"],"abstract_inverted_index":{"Receiver":[0],"operating":[1],"characteristic":[2],"(ROC)":[3],"and":[4,39,158,176],"detection":[5],"error":[6],"tradeoff":[7],"(DET)":[8],"curves":[9],"are":[10,20],"two":[11,151],"widely":[12],"used":[13],"evaluation":[14,91,199],"metrics":[15],"for":[16,93],"speaker":[17,49,94,141,192],"verification.":[18,95],"They":[19],"equivalent":[21],"since":[22],"the":[23,30,58,63,78,83,109,116,120,128,136,139,145,166,170,177,186,190],"latter":[24],"can":[25],"be":[26],"obtained":[27],"by":[28,44,144],"transforming":[29],"former's":[31],"true":[32],"positive":[33],"y-axis":[34,38],"to":[35,76,105],"false":[36],"negative":[37],"then":[40],"re-scaling":[41],"both":[42],"axes":[43],"a":[45,88,123],"probit":[46],"operator.":[47],"Real-world":[48],"verification":[50,142,193],"systems,":[51],"however,":[52],"usually":[53],"work":[54],"on":[55,156,169],"part":[56,81],"of":[57,62,82,119,138,173,180,197],"ROC":[59,65,84],"curve":[60,66,85],"instead":[61],"entire":[64],"given":[67],"an":[68],"application.":[69],"Therefore,":[70],"we":[71,148],"propose":[72,150],"in":[73,195],"this":[74],"article":[75],"use":[77],"area":[79],"under":[80],"(pAUC)":[86],"as":[87],"more":[89],"efficient":[90],"metric":[92,99,112],"A":[96],"Mahalanobis":[97,110],"distance":[98,111],"learning":[100,113],"based":[101,155],"back-end":[102,121,188],"is":[103,122,132],"applied":[104],"optimize":[106],"pAUC,":[107],"where":[108],"guarantees":[114],"that":[115,127,185],"optimization":[117],"objective":[118],"convex":[124],"one":[125],"so":[126],"global":[129],"optimum":[130],"solution":[131],"achievable.":[133],"To":[134],"improve":[135],"performance":[137],"state-of-the-art":[140,191],"systems":[143,168],"proposed":[146,167,187],"back-end,":[147],"further":[149],"feature":[152],"preprocessing":[153],"techniques":[154],"length-normalization":[157],"probabilistic":[159],"linear":[160],"discriminant":[161],"analysis":[162],"respectively.":[163],"We":[164],"evaluate":[165],"major":[171],"languages":[172],"NIST":[174],"SRE16":[175],"core":[178],"tasks":[179],"SITW.":[181],"Experimental":[182],"results":[183],"show":[184],"outperforms":[189],"back-ends":[194],"terms":[196],"seven":[198],"metrics.":[200]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
