{"id":"https://openalex.org/W4402454386","doi":"https://doi.org/10.1145/3674029.3674045","title":"Enhancing Speech Emotion Recognition Using Deep Convolutional Neural Networks","display_name":"Enhancing Speech Emotion Recognition Using Deep Convolutional Neural Networks","publication_year":2024,"publication_date":"2024-05-24","ids":{"openalex":"https://openalex.org/W4402454386","doi":"https://doi.org/10.1145/3674029.3674045"},"language":"en","primary_location":{"id":"doi:10.1145/3674029.3674045","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3674029.3674045","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 9th International Conference on Machine Learning Technologies (ICMLT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3674029.3674045","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100648633","display_name":"M. M. Manjurul Islam","orcid":"https://orcid.org/0000-0002-1823-1304"},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"M M Manjurul Islam","raw_affiliation_strings":["Intelligent System Research Centre, Ulster University, UK"],"raw_orcid":"https://orcid.org/0000-0002-1823-1304","affiliations":[{"raw_affiliation_string":"Intelligent System Research Centre, Ulster University, UK","institution_ids":["https://openalex.org/I138801177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087789749","display_name":"Md Alamgir Kabir","orcid":"https://orcid.org/0000-0002-7136-6339"},"institutions":[{"id":"https://openalex.org/I82509713","display_name":"M\u00e4lardalen University","ror":"https://ror.org/033vfbz75","country_code":"SE","type":"education","lineage":["https://openalex.org/I82509713"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Md Alamgir Kabir","raw_affiliation_strings":["Artificial Intelligence and Intelligent Systems Research Group, Malardalen University, Sweden"],"raw_orcid":"https://orcid.org/0000-0002-7136-6339","affiliations":[{"raw_affiliation_string":"Artificial Intelligence and Intelligent Systems Research Group, Malardalen University, Sweden","institution_ids":["https://openalex.org/I82509713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110695579","display_name":"Alamin Sheikh","orcid":null},"institutions":[{"id":"https://openalex.org/I103434671","display_name":"American International University-Bangladesh","ror":"https://ror.org/02j8ga255","country_code":"BD","type":"education","lineage":["https://openalex.org/I103434671"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Alamin Sheikh","raw_affiliation_strings":["American International University-Bangladesh, Bangladesh"],"raw_orcid":"https://orcid.org/0009-0003-1481-593X","affiliations":[{"raw_affiliation_string":"American International University-Bangladesh, Bangladesh","institution_ids":["https://openalex.org/I103434671"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107132644","display_name":"Muhammad Saiduzzaman","orcid":null},"institutions":[{"id":"https://openalex.org/I103434671","display_name":"American International University-Bangladesh","ror":"https://ror.org/02j8ga255","country_code":"BD","type":"education","lineage":["https://openalex.org/I103434671"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Muhammad Saiduzzaman","raw_affiliation_strings":["American International University-Bangladesh, Bangladesh"],"raw_orcid":"https://orcid.org/0009-0007-1515-8731","affiliations":[{"raw_affiliation_string":"American International University-Bangladesh, Bangladesh","institution_ids":["https://openalex.org/I103434671"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039541632","display_name":"Abdelakram Hafid","orcid":"https://orcid.org/0000-0001-6640-1868"},"institutions":[{"id":"https://openalex.org/I82509713","display_name":"M\u00e4lardalen University","ror":"https://ror.org/033vfbz75","country_code":"SE","type":"education","lineage":["https://openalex.org/I82509713"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Abdelakram Hafid","raw_affiliation_strings":["School of Innovation,Design and Engineering, Malardalen University, Sweden"],"raw_orcid":"https://orcid.org/0000-0001-6640-1868","affiliations":[{"raw_affiliation_string":"School of Innovation,Design and Engineering, Malardalen University, Sweden","institution_ids":["https://openalex.org/I82509713"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103569093","display_name":"Saad Abdullah","orcid":"https://orcid.org/0000-0002-7186-6210"},"institutions":[{"id":"https://openalex.org/I82509713","display_name":"M\u00e4lardalen University","ror":"https://ror.org/033vfbz75","country_code":"SE","type":"education","lineage":["https://openalex.org/I82509713"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Saad Abdullah","raw_affiliation_strings":["School of Innovation,Design and Engineering, Malardalen University, Sweden"],"raw_orcid":"https://orcid.org/0000-0002-7186-6210","affiliations":[{"raw_affiliation_string":"School of Innovation,Design and Engineering, Malardalen University, Sweden","institution_ids":["https://openalex.org/I82509713"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100648633"],"corresponding_institution_ids":["https://openalex.org/I138801177"],"apc_list":null,"apc_paid":null,"fwci":2.4008,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.89068516,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"95","last_page":"100"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7477372288703918},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7382288575172424},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6809720396995544},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.4918828010559082},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.47685420513153076},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.46552392840385437},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4611618220806122},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.44188302755355835}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7477372288703918},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7382288575172424},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6809720396995544},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.4918828010559082},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.47685420513153076},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.46552392840385437},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4611618220806122},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.44188302755355835}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3674029.3674045","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3674029.3674045","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 9th International Conference on Machine Learning Technologies (ICMLT)","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire/61c7a791-9084-4e26-9ceb-56577c34559d","is_oa":true,"landing_page_url":"https://pure.ulster.ac.uk/en/publications/61c7a791-9084-4e26-9ceb-56577c34559d","pdf_url":"https://pure.ulster.ac.uk/ws/files/212940381/3674029.3674045.pdf","source":{"id":"https://openalex.org/S4306402454","display_name":"Ulster University Research Portal (Ulster University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I138801177","host_organization_name":"University of Ulster","host_organization_lineage":["https://openalex.org/I138801177"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Islam, M M M, Kabir, M A, Sheikh, A, Saiduzzaman, M, Hafid, A & Abdullah, S 2024, Enhancing Speech Emotion Recognition Using Deep Convolutional Neural Networks. in Proceedings of the 2024 9th International Conference on Machine Learning Technologies. 2024 9th International Conference on Machine Learning Technologies (ICMLT), Association for Computing Machinery (ACM), pp. 95-100, 2024 9th International Conference on Machine Learning Technologies, Oslo, Norway, 24/05/24. https://doi.org/10.1145/3674029.3674045","raw_type":"contributionToPeriodical"},{"id":"pmh:oai:DiVA.org:mdh-68446","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:mdh:diva-68446","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3674029.3674045","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3674029.3674045","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 9th International Conference on Machine Learning Technologies (ICMLT)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.41999998688697815,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2060132914","https://openalex.org/W2604268783","https://openalex.org/W2624578427","https://openalex.org/W2784665486","https://openalex.org/W2951975883","https://openalex.org/W2959133507","https://openalex.org/W2969889150","https://openalex.org/W2970737019","https://openalex.org/W2997700007","https://openalex.org/W3084484668","https://openalex.org/W3104593614","https://openalex.org/W3109961563","https://openalex.org/W3128401974","https://openalex.org/W3134063422","https://openalex.org/W3197438177","https://openalex.org/W3204087964","https://openalex.org/W3208220966","https://openalex.org/W4212823851","https://openalex.org/W4226442973","https://openalex.org/W4375869379","https://openalex.org/W4385493054"],"related_works":["https://openalex.org/W4226493464","https://openalex.org/W4312417841","https://openalex.org/W3193565141","https://openalex.org/W3133861977","https://openalex.org/W2951211570","https://openalex.org/W3103566983","https://openalex.org/W3167935049","https://openalex.org/W3029198973","https://openalex.org/W4377865163","https://openalex.org/W3126677997"],"abstract_inverted_index":{"Speech":[0,76],"emotion":[1,65],"recognition":[2,142],"(SER)":[3],"is":[4],"considered":[5],"a":[6,16,136],"pivotal":[7],"area":[8],"of":[9,18,31,41,115,154],"research":[10],"that":[11,122],"holds":[12],"significant":[13],"importance":[14],"in":[15,33,47,107,140,161,165],"variety":[17],"real-time":[19,162],"applications,":[20,163],"such":[21],"as":[22],"assessing":[23],"human":[24],"behavior":[25],"and":[26,52,87,100,149],"analyzing":[27],"the":[28,39,73,104,113,123,132,151],"emotional":[29],"states":[30],"speakers":[32],"emergency":[34,167],"situations.":[35,168],"This":[36,144],"paper":[37],"assesses":[38],"capabilities":[40],"deep":[42,58,155],"convolutional":[43],"neural":[44,59],"networks":[45,60],"(CNNs)":[46],"this":[48],"context.":[49],"Both":[50],"CNNs":[51,156],"Long":[53],"Short-Term":[54],"Memory":[55],"(LSTM)":[56],"based":[57],"are":[61,109],"evaluated":[62],"for":[63,157],"voice":[64,108],"identification.":[66],"In":[67],"our":[68],"empirical":[69,119],"evaluation,":[70],"we":[71],"utilize":[72],"Toronto":[74],"Emotional":[75],"Set":[77],"(TESS)":[78],"database,":[79],"which":[80],"comprises":[81],"speech":[82],"samples":[83],"from":[84],"both":[85],"young":[86],"old":[88],"individuals,":[89],"encompassing":[90],"seven":[91],"distinct":[92],"emotions:":[93],"anger,":[94],"happiness,":[95],"sadness,":[96],"fear,":[97],"surprise,":[98],"disgust,":[99],"neutrality.":[101],"To":[102],"augment":[103],"dataset,":[105],"variations":[106],"introduced":[110],"along":[111],"with":[112],"addition":[114],"white":[116],"noise.":[117],"The":[118],"findings":[120],"indicate":[121],"CNN":[124],"model":[125],"outperforms":[126],"existing":[127],"studies":[128],"on":[129],"SER":[130],"using":[131],"TESS":[133],"corpus,":[134],"yielding":[135],"noteworthy":[137],"21%":[138],"improvement":[139],"average":[141],"accuracy.":[143],"work":[145],"underscores":[146],"SER\u2019s":[147],"significance":[148],"highlights":[150],"transformative":[152],"potential":[153],"enhancing":[158],"its":[159],"effectiveness":[160],"particularly":[164],"high-stakes":[166]},"counts_by_year":[{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
