{"id":"https://openalex.org/W32477078","doi":"https://doi.org/10.21437/interspeech.2007-163","title":"Cluster adaptive training weights as features in SVM-based speaker verification","display_name":"Cluster adaptive training weights as features in SVM-based speaker verification","publication_year":2007,"publication_date":"2007-08-27","ids":{"openalex":"https://openalex.org/W32477078","doi":"https://doi.org/10.21437/interspeech.2007-163","mag":"32477078"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2007-163","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2007-163","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2007","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/20.500.11820/1704b725-18c9-4323-914d-bb4e05f5d0c5","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101503841","display_name":"Hao Yang","orcid":"https://orcid.org/0009-0009-8480-5298"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056136429","display_name":"Yuan Dong","orcid":"https://orcid.org/0009-0004-8650-1603"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan Dong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100518039","display_name":"Xianyu Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xianyu Zhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078587654","display_name":"Jian Zhao","orcid":"https://orcid.org/0000-0002-3508-756X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jian Zhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101607148","display_name":"Liang Lu","orcid":"https://orcid.org/0000-0003-4005-679X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang Lu","raw_affiliation_strings":["School of Informatics"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Informatics","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078897088","display_name":"Haila Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haila Wang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.422,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.89360594,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"2013","last_page":"2016"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9674999713897705,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7980180978775024},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.649253785610199},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6184899806976318},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.5983628034591675},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.5941447019577026},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5895294547080994},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5770925283432007},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5684906840324402},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.5525208711624146},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.5170007944107056},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.512612521648407},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.46540743112564087},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.28196173906326294}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7980180978775024},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.649253785610199},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6184899806976318},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.5983628034591675},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.5941447019577026},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5895294547080994},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5770925283432007},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5684906840324402},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.5525208711624146},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.5170007944107056},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.512612521648407},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.46540743112564087},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.28196173906326294},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.21437/interspeech.2007-163","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2007-163","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2007","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.ed.ac.uk:publications/1704b725-18c9-4323-914d-bb4e05f5d0c5","is_oa":true,"landing_page_url":null,"pdf_url":"http://hdl.handle.net/20.500.11820/1704b725-18c9-4323-914d-bb4e05f5d0c5","source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},{"id":"pmh:oai:pure.ed.ac.uk:publications/1704b725-18c9-4323-914d-bb4e05f5d0c5","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/1704b725-18c9-4323-914d-bb4e05f5d0c5","pdf_url":"http://hdl.handle.net/20.500.11820/1704b725-18c9-4323-914d-bb4e05f5d0c5","source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Yang, H, Dong, Y, Zhao, X, Zhao, J, Lu, L & Wang, H 2007, Cluster adaptive training weights as features in SVM-based speaker verification. in INTERSPEECH 2007, 8th Annual Conference of the International Speech Communication Association, Antwerp, Belgium, August 27-31, 2007. pp. 2013-2016, 8th Annual Conference of the International Speech Communication Association, Antwerp, Belgium, 27/08/07. < http://www.isca-speech.org/archive/interspeech_2007/i07_2013.html >","raw_type":"contributionToPeriodical"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.414.19","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.414.19","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://homepages.inf.ed.ac.uk/llu/pdf/cluster.pdf","raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:pure.ed.ac.uk:publications/1704b725-18c9-4323-914d-bb4e05f5d0c5","is_oa":true,"landing_page_url":null,"pdf_url":"http://hdl.handle.net/20.500.11820/1704b725-18c9-4323-914d-bb4e05f5d0c5","source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},"sustainable_development_goals":[{"score":0.6000000238418579,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W32477078.pdf","grobid_xml":"https://content.openalex.org/works/W32477078.grobid-xml"},"referenced_works_count":14,"referenced_works":["https://openalex.org/W31925794","https://openalex.org/W1916834241","https://openalex.org/W2009921239","https://openalex.org/W2023238506","https://openalex.org/W2041823554","https://openalex.org/W2069631319","https://openalex.org/W2101556109","https://openalex.org/W2108948497","https://openalex.org/W2119603452","https://openalex.org/W2124667332","https://openalex.org/W2144760012","https://openalex.org/W2148554390","https://openalex.org/W2165108269","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W1963976507","https://openalex.org/W2048014685","https://openalex.org/W2370972896","https://openalex.org/W2206035908","https://openalex.org/W3119288895","https://openalex.org/W2185075503","https://openalex.org/W1197719229","https://openalex.org/W4247736853","https://openalex.org/W2381158726","https://openalex.org/W2552734076"],"abstract_inverted_index":{"In":[0],"this":[1,100],"paper,":[2],"we":[3],"propose":[4],"the":[5,39,47,56,59,62,67],"use":[6],"of":[7,32,46,49,58,64,79],"cluster":[8,33,40],"adaptive":[9,41],"training":[10,42],"(CAT)":[11],"weights":[12,102],"as":[13],"features":[14],"in":[15,92],"support":[16],"vector":[17,31],"machine":[18],"(SVM)":[19],"based":[20],"text-independent":[21],"verification":[22,68,113],"task.":[23],"The":[24,44],"speaker":[25],"utterance":[26],"is":[27,87],"characterized":[28],"by":[29,54],"a":[30,93,109],"weights,":[34],"which":[35,51],"are":[36,52,70],"extracted":[37],"during":[38],"process.":[43],"effects":[45],"number":[48,63],"classes,":[50],"obtained":[53],"partitioning":[55],"components":[57],"model,":[60],"and":[61,115],"clusters":[65],"on":[66],"performance":[69,107,121],"investigated.":[71],"To":[72],"remove":[73],"session":[74],"variability":[75],"due":[76],"to":[77,108],"influences":[78],"microphone,":[80],"environment,":[81],"etc,":[82],"Nuisance":[83],"Attribute":[84],"Projection":[85],"(NAP)":[86],"also":[88],"evaluated.":[89],"Experimental":[90],"results":[91],"NIST":[94],"SRE":[95],"2006":[96],"task":[97],"show":[98],"that":[99],"CAT":[101],"SVM":[103],"system":[104],"achieves":[105],"comparable":[106],"state-of-the-art":[110],"cepstral":[111],"GMM-UBM":[112],"system,":[114],"their":[116],"fusion":[117],"can":[118],"give":[119],"further":[120],"gains.":[122]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
