{"id":"https://openalex.org/W2996007668","doi":"https://doi.org/10.1109/tencon.2019.8929459","title":"Emotion recognition from audio, dimensional and discrete categorization using CNNs","display_name":"Emotion recognition from audio, dimensional and discrete categorization using CNNs","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2996007668","doi":"https://doi.org/10.1109/tencon.2019.8929459","mag":"2996007668"},"language":"en","primary_location":{"id":"doi:10.1109/tencon.2019.8929459","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tencon.2019.8929459","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"TENCON 2019 - 2019 IEEE Region 10 Conference (TENCON)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061805997","display_name":"Rohan Rajak","orcid":"https://orcid.org/0000-0002-0384-2639"},"institutions":[{"id":"https://openalex.org/I145894827","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511","country_code":"IN","type":"education","lineage":["https://openalex.org/I145894827"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Rohan Rajak","raw_affiliation_strings":["Indian Institute of Technology, Kharagpur, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Kharagpur, India","institution_ids":["https://openalex.org/I145894827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5105166983","display_name":"Rajib Mall","orcid":null},"institutions":[{"id":"https://openalex.org/I145894827","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511","country_code":"IN","type":"education","lineage":["https://openalex.org/I145894827"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rajib Mall","raw_affiliation_strings":["Indian Institute of Technology, Kharagpur, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Kharagpur, India","institution_ids":["https://openalex.org/I145894827"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5061805997"],"corresponding_institution_ids":["https://openalex.org/I145894827"],"apc_list":null,"apc_paid":null,"fwci":2.3029,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.8880111,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"301","last_page":"305"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9794999957084656,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/valence","display_name":"Valence (chemistry)","score":0.8132182955741882},{"id":"https://openalex.org/keywords/arousal","display_name":"Arousal","score":0.6825705766677856},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.665934145450592},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5897442698478699},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.5847735404968262},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.5622567534446716},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.523784339427948},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.5236111283302307},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5066588521003723},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4238380491733551},{"id":"https://openalex.org/keywords/emotion-classification","display_name":"Emotion classification","score":0.4204448163509369},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3344629406929016},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.233625590801239}],"concepts":[{"id":"https://openalex.org/C168900304","wikidata":"https://www.wikidata.org/wiki/Q171407","display_name":"Valence (chemistry)","level":2,"score":0.8132182955741882},{"id":"https://openalex.org/C36951298","wikidata":"https://www.wikidata.org/wiki/Q379784","display_name":"Arousal","level":2,"score":0.6825705766677856},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.665934145450592},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5897442698478699},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.5847735404968262},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.5622567534446716},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.523784339427948},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.5236111283302307},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5066588521003723},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4238380491733551},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.4204448163509369},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3344629406929016},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.233625590801239},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tencon.2019.8929459","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tencon.2019.8929459","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"TENCON 2019 - 2019 IEEE Region 10 Conference (TENCON)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1538131130","https://openalex.org/W1553803945","https://openalex.org/W1589520724","https://openalex.org/W1983364832","https://openalex.org/W2002055708","https://openalex.org/W2045528981","https://openalex.org/W2061068689","https://openalex.org/W2074788634","https://openalex.org/W2087407704","https://openalex.org/W2095705004","https://openalex.org/W2103798534","https://openalex.org/W2146334809","https://openalex.org/W2168465881","https://openalex.org/W2605367287","https://openalex.org/W2746521834","https://openalex.org/W2757888873","https://openalex.org/W2762084293","https://openalex.org/W2784665486","https://openalex.org/W2803193013","https://openalex.org/W2923871787","https://openalex.org/W2964113820","https://openalex.org/W2964128364","https://openalex.org/W6632100814","https://openalex.org/W6633425288","https://openalex.org/W6672004265","https://openalex.org/W6674330103","https://openalex.org/W6684552223"],"related_works":["https://openalex.org/W4305042383","https://openalex.org/W2546649374","https://openalex.org/W4380854332","https://openalex.org/W2184859701","https://openalex.org/W4386232293","https://openalex.org/W4379781104","https://openalex.org/W2382178633","https://openalex.org/W3003834951","https://openalex.org/W4380370144","https://openalex.org/W2127511193"],"abstract_inverted_index":{"Emotions":[0],"can":[1,77],"not":[2],"be":[3,79],"estimated":[4],"with":[5,35,43,101,126],"text":[6,20,36],"alone":[7],"as":[8],"irony,":[9],"humour,":[10],"cadence":[11],"etc.":[12],"are":[13,29],"important":[14],"components":[15],"of":[16,46,55,63,70,82,96,116,216],"a":[17,22,49,60,68,184,213,221],"speech.":[18],"So,":[19],"has":[21],"limited":[23],"capacity":[24],"in":[25,32,48,87,224,228,251],"conveying":[26],"emotions.":[27],"There":[28],"various":[30,73],"work":[31,104],"sentiment":[33],"analysis":[34],"and":[37,84,98,106,122,124,128,135,141,146,148,156,171,189,194,199,231,244],"speech":[38],"but":[39,210],"this":[40],"project":[41],"deals":[42],"the":[44,93,111,166,241],"identification":[45],"mood":[47],"non-discrete":[50],"way.":[51],"The":[52,197],"traditional":[53],"method":[54,69],"prediction":[56,161,204,249],"emotion":[57,160,223],"where":[58],"labeling":[59],"certain":[61],"number":[62],"discrete":[64,242],"emotions":[65,86,97,218],"is":[66],"obviously":[67],"classification":[71],"using":[72,254],"learning":[74],"techniques.":[75],"But":[76],"there":[78],"other":[80],"techniques":[81],"describing":[83],"understanding":[85],"speech?":[88],"This":[89],"paper":[90],"first":[91],"discusses":[92],"different":[94,214,256],"dimensions":[95],"compares":[99],"them":[100],"previous":[102],"similar":[103],"(Chung":[105],"Yoon(2012))":[107],"[6],":[108],"they":[109],"classified":[110],"user's":[112],"data":[113],"into":[114],"classes":[115,130,145,153],"2":[117,129,152,206],"types":[118],"(high,":[119],"normal,":[120],"low)":[121,125],"(high":[123],"3":[127,208],"respectively":[131],"for":[132,143,151,175,191,240],"both":[133],"Valence":[134,155,193],"Arousal.":[136],"Their":[137],"performance":[138],"was":[139],"53.4%":[140],"51.0%":[142],"three":[144],"66.6%":[147],"66.4%":[149],"accuracy":[150,239,253],"on":[154,162,179,205,247,259],"Arousal":[157,195],"upon":[158],"exact":[159,192],"DEAP":[163,180],"dataset.":[164,261],"Using":[165],"same":[167],"dataset":[168],"\u201cUsing":[169],"Deep":[170],"Convolutional":[172],"Neural":[173],"Networks":[174],"Accurate":[176],"Emotion":[177],"Classification":[178],"Dataset\u201d":[181],"[5]":[182],"concludes":[183],"CNN":[185,257],"model":[186,201,243],"providing":[187],"66.79%":[188],"57.58%":[190],"prediction.":[196],"valence":[198,230],"arousal":[200,232],"follow":[202],"accurate":[203],"or":[207],"classes,":[209],"we":[211,235],"had":[212,236],"approach":[215,246],"predicting":[217],"by":[219],"placing":[220],"particular":[222],"its":[225],"respective":[226],"quadrant":[227,248],"2D":[229],"axis.":[233],"However,":[234],"around":[237],"50-55%":[238],"our":[245],"resulted":[250],"76.2%":[252],"two":[255],"architectures":[258],"RAVDESS":[260]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
