{"id":"https://openalex.org/W2808456396","doi":"https://doi.org/10.21437/interspeech.2018-1883","title":"On Enhancing Speech Emotion Recognition Using Generative Adversarial Networks","display_name":"On Enhancing Speech Emotion Recognition Using Generative Adversarial Networks","publication_year":2018,"publication_date":"2018-08-28","ids":{"openalex":"https://openalex.org/W2808456396","doi":"https://doi.org/10.21437/interspeech.2018-1883","mag":"2808456396"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2018-1883","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2018-1883","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2018","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1806.06626","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102988572","display_name":"Saurabh Sahu","orcid":"https://orcid.org/0000-0001-6222-1587"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Saurabh Sahu","raw_affiliation_strings":["University of Southern California, Los Angeles, United States"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, United States","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075937808","display_name":"Rahul Gupta","orcid":"https://orcid.org/0000-0002-9277-3718"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rahul Gupta","raw_affiliation_strings":["Amazon (United States), Seattle, United States"],"affiliations":[{"raw_affiliation_string":"Amazon (United States), Seattle, United States","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078241735","display_name":"Carol Espy-Wilson","orcid":"https://orcid.org/0000-0002-1012-183X"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Carol Espy-Wilson","raw_affiliation_strings":["University of Southern California, Los Angeles, United States"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, United States","institution_ids":["https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102988572"],"corresponding_institution_ids":["https://openalex.org/I1174212"],"apc_list":null,"apc_paid":null,"fwci":2.0209,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":{"value":0.9042938,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"3693","last_page":"3697"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.8836078643798828},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7204735279083252},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6322131752967834},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5945107936859131},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5770899653434753},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5611403584480286},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.5553596019744873},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47912144660949707},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.44969141483306885},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.4228418469429016},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.41066649556159973},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3816349506378174},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3756210505962372},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.07200458645820618}],"concepts":[{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.8836078643798828},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7204735279083252},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6322131752967834},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5945107936859131},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5770899653434753},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5611403584480286},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.5553596019744873},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47912144660949707},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.44969141483306885},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.4228418469429016},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.41066649556159973},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3816349506378174},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3756210505962372},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.07200458645820618},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.21437/interspeech.2018-1883","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2018-1883","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2018","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1806.06626","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1806.06626","pdf_url":"https://arxiv.org/pdf/1806.06626","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2808456396","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1806.06626.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1806.06626","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1806.06626","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1806.06626","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1806.06626","pdf_url":"https://arxiv.org/pdf/1806.06626","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7300000190734863}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1994348490","https://openalex.org/W2090777335","https://openalex.org/W2125389028","https://openalex.org/W2173520492","https://openalex.org/W2298992465","https://openalex.org/W2342475039","https://openalex.org/W2396718206","https://openalex.org/W2510254673","https://openalex.org/W2577946330","https://openalex.org/W2951520714","https://openalex.org/W2962686539","https://openalex.org/W2963073614","https://openalex.org/W2963569749"],"related_works":["https://openalex.org/W2962993399","https://openalex.org/W2146334809","https://openalex.org/W2173520492","https://openalex.org/W2099471712","https://openalex.org/W2963569749","https://openalex.org/W2962793481","https://openalex.org/W2962686539","https://openalex.org/W2399733683","https://openalex.org/W2903311573","https://openalex.org/W3119330895","https://openalex.org/W3160150257","https://openalex.org/W2972640480","https://openalex.org/W2963373786","https://openalex.org/W2890002510","https://openalex.org/W2800126857","https://openalex.org/W2342475039","https://openalex.org/W2239141610","https://openalex.org/W2055911634","https://openalex.org/W2945178666","https://openalex.org/W2964057616"],"abstract_inverted_index":{"Generative":[0],"Adversarial":[1],"Networks":[2],"(GANs)":[3],"have":[4],"gained":[5],"a":[6,29,32,38,43,54,98,106,119,145,159,180],"lot":[7],"of":[8,28,68,79,105,110,126,149],"attention":[9],"from":[10,53,71],"machine":[11],"learning":[12],"community":[13],"due":[14],"to":[15,18,41,81,140],"their":[16],"ability":[17],"learn":[19,42],"and":[20,31],"mimic":[21],"an":[22],"input":[23],"data":[24,46,165,171],"distribution.":[25,74],"GANs":[26,80],"consist":[27],"discriminator":[30],"generator":[33],"working":[34],"in":[35,158],"tandem":[36],"playing":[37],"min-max":[39],"game":[40],"target":[44,73],"underlying":[45],"distribution;":[47],"when":[48,162],"fed":[49],"with":[50,169],"data-points":[51],"sampled":[52,70],"simpler":[55],"distribution":[56,104,125],"(like":[57],"uniform":[58],"or":[59,136],"Gaussian":[60],"distribution).":[61],"Once":[62],"trained,":[63],"they":[64],"allow":[65],"synthetic":[66,83,164],"generation":[67],"examples":[69],"the":[72,77,103,111,124,127,134,137,163],"We":[75,174],"investigate":[76,93],"application":[78,148],"generate":[82],"feature":[84,115,130],"vectors":[85,131],"used":[86,167],"for":[87,172],"speech":[88],"emotion":[89],"recognition.":[90],"Specifically,":[91],"we":[92,154],"two":[94],"set":[95],"ups:":[96],"(i)":[97],"vanilla":[99],"GAN":[100,121],"that":[101,122],"learns":[102,123],"lower":[107],"dimensional":[108,114,129],"representation":[109],"actual":[112],"higher":[113,128],"vector":[116],"and,":[117],"(ii)":[118],"conditional":[120],"conditioned":[132],"on":[133],"labels":[135],"emotional":[138],"class":[139],"which":[141],"it":[142],"belongs.":[143],"As":[144],"potential":[146],"practical":[147],"these":[150],"synthetically":[151],"generated":[152],"samples,":[153],"measure":[155],"any":[156],"improvement":[157],"classifier's":[160],"performance":[161],"is":[166],"along":[168],"real":[170],"training.":[173],"perform":[175],"cross-validation":[176],"analyses":[177],"followed":[178],"by":[179],"cross-corpus":[181],"study.":[182]},"counts_by_year":[{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":5}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
