{"id":"https://openalex.org/W2944787130","doi":"https://doi.org/10.1109/iscslp.2018.8706610","title":"Speech Emotion Recognition using Convolutional Neural Network with Audio Word-based Embedding","display_name":"Speech Emotion Recognition using Convolutional Neural Network with Audio Word-based Embedding","publication_year":2018,"publication_date":"2018-11-01","ids":{"openalex":"https://openalex.org/W2944787130","doi":"https://doi.org/10.1109/iscslp.2018.8706610","mag":"2944787130"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp.2018.8706610","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2018.8706610","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065699174","display_name":"Kun-Yi Huang","orcid":"https://orcid.org/0000-0002-3629-7091"},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Kun-Yi Huang","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103251327","display_name":"Chung\u2010Hsien Wu","orcid":"https://orcid.org/0000-0002-3947-2123"},"institutions":[{"id":"https://openalex.org/I84653119","display_name":"Academia Sinica","ror":"https://ror.org/05bxb3784","country_code":"TW","type":"facility","lineage":["https://openalex.org/I84653119"]},{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chung-Hsien Wu","raw_affiliation_strings":["PhD Program for Multimedia Systems and Intelligent Computing, National Cheng Kung University and Academia Sinica, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"PhD Program for Multimedia Systems and Intelligent Computing, National Cheng Kung University and Academia Sinica, Taiwan","institution_ids":["https://openalex.org/I91807558","https://openalex.org/I84653119"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054849851","display_name":"Qian-Bei Hong","orcid":"https://orcid.org/0000-0003-2123-1601"},"institutions":[{"id":"https://openalex.org/I84653119","display_name":"Academia Sinica","ror":"https://ror.org/05bxb3784","country_code":"TW","type":"facility","lineage":["https://openalex.org/I84653119"]},{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Qian-Bei Hong","raw_affiliation_strings":["PhD Program for Multimedia Systems and Intelligent Computing, National Cheng Kung University and Academia Sinica, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"PhD Program for Multimedia Systems and Intelligent Computing, National Cheng Kung University and Academia Sinica, Taiwan","institution_ids":["https://openalex.org/I91807558","https://openalex.org/I84653119"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091093449","display_name":"Ming-Hsiang Su","orcid":"https://orcid.org/0000-0003-0633-774X"},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Ming-Hsiang Su","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033843478","display_name":"Yuan-Rong Zeng","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yuan-Rong Zeng","raw_affiliation_strings":["Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Engineering, National Cheng Kung University, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.5327,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.8445081,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9787999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7859890460968018},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.732491672039032},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5549331307411194},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.48232194781303406},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.47844627499580383},{"id":"https://openalex.org/keywords/sadness","display_name":"Sadness","score":0.43773478269577026},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4120633602142334},{"id":"https://openalex.org/keywords/anger","display_name":"Anger","score":0.24117842316627502},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.11519089341163635}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7859890460968018},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.732491672039032},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5549331307411194},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.48232194781303406},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.47844627499580383},{"id":"https://openalex.org/C2779812673","wikidata":"https://www.wikidata.org/wiki/Q169251","display_name":"Sadness","level":3,"score":0.43773478269577026},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4120633602142334},{"id":"https://openalex.org/C2779302386","wikidata":"https://www.wikidata.org/wiki/Q79871","display_name":"Anger","level":2,"score":0.24117842316627502},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.11519089341163635},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp.2018.8706610","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2018.8706610","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.5199999809265137}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1479771596","https://openalex.org/W1501669607","https://openalex.org/W2001702556","https://openalex.org/W2003097445","https://openalex.org/W2037960784","https://openalex.org/W2038821742","https://openalex.org/W2058819080","https://openalex.org/W2064675550","https://openalex.org/W2087618018","https://openalex.org/W2089787547","https://openalex.org/W2149345536","https://openalex.org/W2168465881","https://openalex.org/W2188183693","https://openalex.org/W2339343773","https://openalex.org/W2399733683","https://openalex.org/W2518110751","https://openalex.org/W6628675675","https://openalex.org/W6630073874","https://openalex.org/W6682119568"],"related_works":["https://openalex.org/W2120267809","https://openalex.org/W2373147122","https://openalex.org/W2913307771","https://openalex.org/W2058555531","https://openalex.org/W4311605484","https://openalex.org/W2902116245","https://openalex.org/W2393989740","https://openalex.org/W2558014965","https://openalex.org/W4281384481","https://openalex.org/W4307784074"],"abstract_inverted_index":{"A":[0],"complete":[1],"emotional":[2,29,97],"expression":[3],"typically":[4],"contains":[5],"a":[6,11,34],"complex":[7],"temporal":[8],"course":[9],"in":[10],"natural":[12],"conversation.":[13],"Related":[14],"research":[15],"on":[16],"utterance-level,":[17],"segment-level":[18],"and":[19,125,129],"multi-level":[20],"processing":[21],"lacks":[22],"understanding":[23],"of":[24,28,62,94,139,160,180,195],"the":[25,58,82,89,95,107,137,140,152,167,177,188],"underlying":[26],"relation":[27],"speech.":[30],"In":[31,48],"this":[32,49],"work,":[33],"convolutional":[35],"neural":[36],"network":[37],"(CNN)":[38],"with":[39,100,185],"audio":[40,67,84,90,189],"word-based":[41,190],"embedding":[42,191],"is":[43,53,73],"proposed":[44,141,153],"for":[45,144,197],"emotion":[46,101,110,117,146,157,199],"modeling.":[47],"study,":[50],"vector":[51,86,92],"quantization":[52],"first":[54],"applied":[55],"to":[56,75,105,135,166],"convert":[57,76],"low":[59],"level":[60],"features":[61],"each":[63],"speech":[64,79,98,145,198],"frame":[65],"into":[66,81],"words":[68],"using":[69],"k-means":[70],"algorithm.":[71],"Word2vec":[72],"adopted":[74],"an":[77,156,193],"input":[78,182],"utterance":[80],"corresponding":[83],"word":[85,91],"sequence.":[87,183],"Finally,":[88],"sequences":[93],"training":[96],"data":[99],"annotation":[102],"are":[103],"used":[104,134],"construct":[106],"CNN-":[108],"based":[109,173],"model.":[111],"The":[112],"NCKU-ES":[113],"database,":[114],"containing":[115],"seven":[116],"categories:":[118],"happiness,":[119],"boredom,":[120],"anger,":[121],"anxiety,":[122],"sadness,":[123],"surprise":[124],"disgust,":[126],"was":[127,133],"collected":[128],"five-fold":[130],"cross":[131],"validation":[132],"evaluate":[136],"performance":[138],"CNN-based":[142],"method":[143,154],"recognition.":[147,200],"Experimental":[148],"results":[149],"show":[150],"that":[151],"achieved":[155,192],"recognition":[158],"accuracy":[159],"82.34%,":[161],"improving":[162],"by":[163],"8.7%":[164],"compared":[165],"Long":[168],"Short":[169],"Term":[170],"Memory":[171],"(LSTM)-":[172],"method,":[174],"which":[175],"faced":[176],"challenging":[178],"issue":[179],"long":[181],"Comparing":[184],"raw":[186],"features,":[187],"improvement":[194],"3.4%":[196]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
