{"id":"https://openalex.org/W2059254811","doi":"https://doi.org/10.1109/icassp.2009.4960557","title":"iFLY system for the NIST 2008 speaker recognition evaluation","display_name":"iFLY system for the NIST 2008 speaker recognition evaluation","publication_year":2009,"publication_date":"2009-04-01","ids":{"openalex":"https://openalex.org/W2059254811","doi":"https://doi.org/10.1109/icassp.2009.4960557","mag":"2059254811"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2009.4960557","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2009.4960557","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038369085","display_name":"Wu Guo","orcid":"https://orcid.org/0000-0002-3779-7944"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wu Guo","raw_affiliation_strings":["MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China"],"affiliations":[{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056415893","display_name":"Yanhua Long","orcid":"https://orcid.org/0000-0003-0924-408X"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanhua Long","raw_affiliation_strings":["MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China"],"affiliations":[{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034059240","display_name":"Yijie Li","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yijie Li","raw_affiliation_strings":["MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China"],"affiliations":[{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048654038","display_name":"Lei Pan","orcid":"https://orcid.org/0000-0002-1111-5570"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Pan","raw_affiliation_strings":["MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China"],"affiliations":[{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002548873","display_name":"Eryu Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Eryu Wang","raw_affiliation_strings":["MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China"],"affiliations":[{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057227915","display_name":"Li-Rong Dai","orcid":"https://orcid.org/0000-0002-0859-2827"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lirong Dai","raw_affiliation_strings":["MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China"],"affiliations":[{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"MOE-Microsoft Key Laboratory of Multimedia Computing and Communication, University of Science and Technology of China (USTC), China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5038369085"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":1.7447,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.86963681,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"4209","last_page":"4212"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.9317684173583984},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7656234502792358},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7375266551971436},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.6434146165847778},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6067171692848206},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5154464840888977},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5064989328384399},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4928927421569824},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.459328830242157},{"id":"https://openalex.org/keywords/compensation","display_name":"Compensation (psychology)","score":0.45836812257766724},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43775075674057007},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.41491276025772095}],"concepts":[{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.9317684173583984},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7656234502792358},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7375266551971436},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.6434146165847778},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6067171692848206},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5154464840888977},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5064989328384399},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4928927421569824},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.459328830242157},{"id":"https://openalex.org/C2780023022","wikidata":"https://www.wikidata.org/wiki/Q1338171","display_name":"Compensation (psychology)","level":2,"score":0.45836812257766724},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43775075674057007},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.41491276025772095},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C11171543","wikidata":"https://www.wikidata.org/wiki/Q41630","display_name":"Psychoanalysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2009.4960557","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2009.4960557","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W134766468","https://openalex.org/W2041823554","https://openalex.org/W2073693905","https://openalex.org/W2079076391","https://openalex.org/W2123486077","https://openalex.org/W2128391065","https://openalex.org/W2131469787","https://openalex.org/W2136879537","https://openalex.org/W2144760012"],"related_works":["https://openalex.org/W2158491338","https://openalex.org/W2807901368","https://openalex.org/W2133733652","https://openalex.org/W2072658171","https://openalex.org/W2606392311","https://openalex.org/W2320042380","https://openalex.org/W4385956668","https://openalex.org/W2900895161","https://openalex.org/W4380838366","https://openalex.org/W2539884462"],"abstract_inverted_index":{"The":[0],"description":[1],"of":[2,34,45],"iFLY":[3],"system":[4,30,89],"submitted":[5],"for":[6],"NIST":[7],"2008":[8,20],"speaker":[9],"recognition":[10],"evaluation":[11],"(SRE),":[12],"which":[13],"has":[14],"achieved":[15],"excellent":[16],"performance":[17],"in":[18,25,60,87],"the":[19,70,88],"SRE":[21],"evaluation,":[22],"is":[23,31],"presented":[24],"this":[26,61],"paper.":[27],"Our":[28],"primary":[29],"a":[32],"fusion":[33],"two":[35,43],"subsystems":[36],"GMM-UBM":[37],"and":[38,50,69,81],"GMM-SVM.":[39],"For":[40],"each":[41],"sub-system,":[42],"kinds":[44],"short-time":[46],"acoustic":[47],"features":[48],"PLP":[49],"LPCC":[51],"are":[52],"adopted.":[53],"We":[54,74],"focus":[55],"on":[56],"three":[57],"key":[58,85],"issues":[59],"evaluation:":[62],"channel":[63],"compensation,":[64],"multi-lingual":[65],"or":[66],"bi-lingual":[67],"cues":[68],"voice":[71],"activity":[72],"detection.":[73],"also":[75],"point":[76],"out":[77],"that":[78],"data":[79],"selection":[80],"factor":[82],"analysis":[83],"play":[84],"roles":[86],"improvement.":[90]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
