{"id":"https://openalex.org/W2786656445","doi":"https://doi.org/10.1109/asru.2017.8268991","title":"Adversarial manifold learning for speaker recognition","display_name":"Adversarial manifold learning for speaker recognition","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2786656445","doi":"https://doi.org/10.1109/asru.2017.8268991","mag":"2786656445"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2017.8268991","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2017.8268991","pdf_url":null,"source":{"id":"https://openalex.org/S4306498158","display_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061908942","display_name":"Jen\u2010Tzung Chien","orcid":"https://orcid.org/0000-0003-3466-8941"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Jen-Tzung Chien","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022495855","display_name":"Kang-Ting Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Kang-Ting Peng","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National Chiao Tung University, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National Chiao Tung University, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5061908942"],"corresponding_institution_ids":["https://openalex.org/I148366613"],"apc_list":null,"apc_paid":null,"fwci":3.1204,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.93588858,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"9","issue":null,"first_page":"599","last_page":"605"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9865999817848206,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.9066898822784424},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7577642202377319},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6992640495300293},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.6344174742698669},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6074607968330383},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5877129435539246},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5509153008460999},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5265536308288574},{"id":"https://openalex.org/keywords/latent-variable","display_name":"Latent variable","score":0.5075181722640991},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.465166836977005},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4529208540916443},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.071282297372818}],"concepts":[{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.9066898822784424},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7577642202377319},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6992640495300293},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.6344174742698669},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6074607968330383},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5877129435539246},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5509153008460999},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5265536308288574},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.5075181722640991},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.465166836977005},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4529208540916443},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.071282297372818},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru.2017.8268991","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2017.8268991","pdf_url":null,"source":{"id":"https://openalex.org/S4306498158","display_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7599999904632568}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1539175566","https://openalex.org/W1959608418","https://openalex.org/W2049633694","https://openalex.org/W2099471712","https://openalex.org/W2109761419","https://openalex.org/W2121812409","https://openalex.org/W2143797877","https://openalex.org/W2150769028","https://openalex.org/W2157444450","https://openalex.org/W2162055300","https://openalex.org/W2180339972","https://openalex.org/W2187089797","https://openalex.org/W2405331948","https://openalex.org/W2408468826","https://openalex.org/W2585630030","https://openalex.org/W2590440273","https://openalex.org/W2604209903","https://openalex.org/W2606786299","https://openalex.org/W2662551090","https://openalex.org/W2662639535","https://openalex.org/W2748488820","https://openalex.org/W2941689885","https://openalex.org/W2963865839","https://openalex.org/W2964121744","https://openalex.org/W4293568373","https://openalex.org/W4320013936","https://openalex.org/W6631190155","https://openalex.org/W6632384406","https://openalex.org/W6640963894","https://openalex.org/W6681474766","https://openalex.org/W6683161245"],"related_works":["https://openalex.org/W4293202849","https://openalex.org/W1980965563","https://openalex.org/W1489300767","https://openalex.org/W2387995142","https://openalex.org/W4380714744","https://openalex.org/W4319453655","https://openalex.org/W2089959425","https://openalex.org/W2057775761","https://openalex.org/W2988134182","https://openalex.org/W2770818364"],"abstract_inverted_index":{"This":[0,66],"paper":[1],"presents":[2],"an":[3,25,60,90],"adversarial":[4,61,91],"manifold":[5,148],"learning":[6,46,62,74,85,149],"(AML)":[7],"for":[8,27,35,47,86],"speaker":[9,140],"recognition":[10,141],"based":[11,80],"on":[12,81,139],"the":[13,29,37,101,105,111,132,143],"probabilistic":[14],"linear":[15],"discriminant":[16],"analysis":[17],"(PLDA)":[18],"using":[19,131],"i-vectors.":[20,38],"PLDA":[21],"basically":[22],"consists":[23],"of":[24,145],"encoder":[26],"finding":[28],"latent":[30,49,53,118],"variables":[31],"and":[32,42,89,97,125,150],"a":[33,48,77,83,95,98],"decoder":[34,124],"reconstructing":[36],"AML":[39],"is":[40,55,68,107],"developed":[41],"incorporated":[43],"in":[44,117,122,147],"deep":[45,102],"variable":[50],"model.":[51],"Low-dimensional":[52],"space":[54],"therefore":[56],"constructed":[57],"according":[58],"to":[59,70,109],"with":[63,113],"neighbor":[64,87],"embedding.":[65],"AML-PLDA":[67,146],"formulated":[69],"jointly":[71,128],"optimize":[72],"three":[73],"objectives":[75],"including":[76],"reconstruction":[78],"error":[79],"PLDA,":[82],"subspace":[84],"embedding":[88],"loss":[92],"caused":[93],"by":[94,130],"discriminator":[96,112,126],"generator.":[99],"Using":[100],"neural":[103],"networks,":[104],"generator":[106],"trained":[108],"fool":[110],"its":[114],"generated":[115],"samples":[116],"space.":[119],"The":[120,137],"parameters":[121],"encoder,":[123],"are":[127],"estimated":[129],"stochastic":[133],"gradient":[134],"descent":[135],"algorithm.":[136],"experiments":[138],"show":[142],"merit":[144],"pattern":[151],"classification.":[152]},"counts_by_year":[{"year":2020,"cited_by_count":13},{"year":2019,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
