{"id":"https://openalex.org/W4389318028","doi":"https://doi.org/10.1109/tnnls.2023.3335119","title":"GLGAN-VC: A Guided Loss-Based Generative Adversarial Network for Many-to-Many Voice Conversion","display_name":"GLGAN-VC: A Guided Loss-Based Generative Adversarial Network for Many-to-Many Voice Conversion","publication_year":2023,"publication_date":"2023-12-04","ids":{"openalex":"https://openalex.org/W4389318028","doi":"https://doi.org/10.1109/tnnls.2023.3335119","pmid":"https://pubmed.ncbi.nlm.nih.gov/38048246"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2023.3335119","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3335119","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102798862","display_name":"Sandipan Dhar","orcid":"https://orcid.org/0000-0002-3606-6664"},"institutions":[{"id":"https://openalex.org/I155837530","display_name":"National Institute of Technology Durgapur","ror":"https://ror.org/04ds0jm32","country_code":"IN","type":"education","lineage":["https://openalex.org/I155837530"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Sandipan Dhar","raw_affiliation_strings":["Department of Computer Science and Engineering, National Institute of Technology Durgapur, Durgapur, West Bengal, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, National Institute of Technology Durgapur, Durgapur, West Bengal, India","institution_ids":["https://openalex.org/I155837530"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055489209","display_name":"Nanda Dulal Jana","orcid":"https://orcid.org/0000-0003-0631-9912"},"institutions":[{"id":"https://openalex.org/I155837530","display_name":"National Institute of Technology Durgapur","ror":"https://ror.org/04ds0jm32","country_code":"IN","type":"education","lineage":["https://openalex.org/I155837530"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Nanda Dulal Jana","raw_affiliation_strings":["Department of Computer Science and Engineering, National Institute of Technology Durgapur, Durgapur, West Bengal, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, National Institute of Technology Durgapur, Durgapur, West Bengal, India","institution_ids":["https://openalex.org/I155837530"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000078546","display_name":"Swagatam Das","orcid":"https://orcid.org/0000-0001-6843-4508"},"institutions":[{"id":"https://openalex.org/I6498739","display_name":"Indian Statistical Institute","ror":"https://ror.org/00q2w1j53","country_code":"IN","type":"education","lineage":["https://openalex.org/I6498739"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Swagatam Das","raw_affiliation_strings":["Institute for Advancing Intelligence (IAI), TCG CREST, Kolkata, India","Electronics and Communication Sciences Unit, Indian Statistical Institute, Kolkata, India"],"affiliations":[{"raw_affiliation_string":"Institute for Advancing Intelligence (IAI), TCG CREST, Kolkata, India","institution_ids":[]},{"raw_affiliation_string":"Electronics and Communication Sciences Unit, Indian Statistical Institute, Kolkata, India","institution_ids":["https://openalex.org/I6498739"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102798862"],"corresponding_institution_ids":["https://openalex.org/I155837530"],"apc_list":null,"apc_paid":null,"fwci":1.8942,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.8884642,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"36","issue":"1","first_page":"1813","last_page":"1826"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9871000051498413,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10863","display_name":"Voice and Speech Disorders","score":0.9851999878883362,"subfield":{"id":"https://openalex.org/subfields/2737","display_name":"Physiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/upsampling","display_name":"Upsampling","score":0.8000056147575378},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7595577239990234},{"id":"https://openalex.org/keywords/naturalness","display_name":"Naturalness","score":0.751065731048584},{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.6551821827888489},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6492893695831299},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4987168312072754},{"id":"https://openalex.org/keywords/generative-adversarial-network","display_name":"Generative adversarial network","score":0.42914503812789917},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.4285087287425995},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3376370072364807},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.30021560192108154}],"concepts":[{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.8000056147575378},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7595577239990234},{"id":"https://openalex.org/C134537474","wikidata":"https://www.wikidata.org/wiki/Q17144832","display_name":"Naturalness","level":2,"score":0.751065731048584},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.6551821827888489},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6492893695831299},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4987168312072754},{"id":"https://openalex.org/C2988773926","wikidata":"https://www.wikidata.org/wiki/Q25104379","display_name":"Generative adversarial network","level":3,"score":0.42914503812789917},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.4285087287425995},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3376370072364807},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.30021560192108154},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2023.3335119","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3335119","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:38048246","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38048246","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6800000071525574,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W2008622809","https://openalex.org/W2040734426","https://openalex.org/W2123771434","https://openalex.org/W2126143605","https://openalex.org/W2423276646","https://openalex.org/W2471520273","https://openalex.org/W2473388484","https://openalex.org/W2518172956","https://openalex.org/W2576309025","https://openalex.org/W2589759987","https://openalex.org/W2765293924","https://openalex.org/W2804998325","https://openalex.org/W2888922217","https://openalex.org/W2902070858","https://openalex.org/W2913006054","https://openalex.org/W2936002583","https://openalex.org/W2937579788","https://openalex.org/W2962896155","https://openalex.org/W2963035245","https://openalex.org/W2963539064","https://openalex.org/W2963767194","https://openalex.org/W2972452545","https://openalex.org/W2972667718","https://openalex.org/W2972849140","https://openalex.org/W3015434413","https://openalex.org/W3015805741","https://openalex.org/W3015959238","https://openalex.org/W3024443431","https://openalex.org/W3095936335","https://openalex.org/W3096356991","https://openalex.org/W3096864844","https://openalex.org/W3098557217","https://openalex.org/W3158484908","https://openalex.org/W3163573274","https://openalex.org/W3196667132","https://openalex.org/W3200011735","https://openalex.org/W4205267278","https://openalex.org/W4252337780","https://openalex.org/W4293023358","https://openalex.org/W6631190155","https://openalex.org/W6687506355","https://openalex.org/W6722194198","https://openalex.org/W6729110096","https://openalex.org/W6741832134","https://openalex.org/W6762238293","https://openalex.org/W6762533536","https://openalex.org/W6767141205","https://openalex.org/W6767245602","https://openalex.org/W6840412704"],"related_works":["https://openalex.org/W3214732802","https://openalex.org/W3209202081","https://openalex.org/W4226324275","https://openalex.org/W3217069185","https://openalex.org/W3049340819","https://openalex.org/W4308928038","https://openalex.org/W4200430540","https://openalex.org/W3141413246","https://openalex.org/W2808862658","https://openalex.org/W4322709305"],"abstract_inverted_index":{"Many-to-many":[0],"voice":[1],"conversion":[2],"(VC)":[3],"is":[4,62,159,179],"a":[5,43,85,92,116,145],"technique":[6],"aimed":[7],"at":[8],"mapping":[9,128],"speech":[10,38,51,71,126,203,230,238],"features":[11],"between":[12,46,169],"multiple":[13],"speakers":[14],"during":[15],"training":[16],"and":[17,49,76,106,119,144,171,174,200,212,232],"transferring":[18],"the":[19,33,36,47,107,236],"vocal":[20],"characteristics":[21],"of":[22,35,55,109,229],"one":[23],"source":[24,37,170],"speaker":[25,233],"to":[26,97,140,151,161],"another":[27],"target":[28,172],"speaker,":[29],"all":[30],"while":[31],"maintaining":[32],"content":[34,142],"unchanged.":[39],"Existing":[40],"research":[41],"highlights":[42],"notable":[44],"gap":[45],"original":[48],"generated":[50,237],"samples":[52,72],"in":[53,67,130,165,227,235],"terms":[54,228],"naturalness":[56],"within":[57],"many-to-many":[58,99,223],"VC.":[59,132],"Therefore,":[60],"there":[61],"substantial":[63],"room":[64],"for":[65,73,124,181],"improvement":[66],"achieving":[68],"more":[69],"natural-sounding":[70],"both":[74,210],"parallel":[75],"nonparallel":[77],"VC":[78,100,225],"scenarios.":[79],"In":[80,133],"this":[81],"study,":[82],"we":[83,135],"introduce":[84],"generative":[86],"adversarial":[87],"network":[88,123,150],"(GAN)":[89],"system":[90],"with":[91],"guided":[93,155],"loss":[94,111,139,156,178],"(GLGAN-VC)":[95],"designed":[96],"enhance":[98],"by":[101],"focusing":[102],"on":[103,190,209],"architectural":[104],"improvements":[105],"integration":[108],"alternative":[110],"functions.":[112],"Our":[113,206],"approach":[114],"includes":[115],"pair-wise":[117],"downsampling":[118],"upsampling":[120],"(PDU)":[121],"generator":[122],"effective":[125],"feature":[127,167],"(FM)":[129],"multidomain":[131],"addition,":[134],"incorporate":[136],"an":[137,175,201],"FM":[138],"preserve":[141],"information":[143,184],"residual":[146],"connection":[147],"(RC)-based":[148],"discriminator":[149],"improve":[152],"learning.":[153],"A":[154],"(GL)":[157],"function":[158],"introduced":[160],"efficiently":[162],"capture":[163],"differences":[164],"latent":[166],"representations":[168],"speakers,":[173],"enhanced":[176],"reconstruction":[177],"proposed":[180],"better":[182],"contextual":[183],"preservation.":[185],"We":[186],"evaluate":[187],"our":[188,218],"model":[189,219],"various":[191],"datasets,":[192],"including":[193],"VCC":[194,196,198],"2016,":[195],"2018,":[197],"2020,":[199],"emotional":[202],"dataset":[204],"(ESD).":[205],"results,":[207],"based":[208],"subjective":[211],"objective":[213],"evaluation":[214],"metrics,":[215],"demonstrate":[216],"that":[217],"outperforms":[220],"state-of-the-art":[221],"(SOTA)":[222],"GAN-based":[224],"models":[226],"quality":[231],"similarity":[234],"samples.":[239]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":4}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
