{"id":"https://openalex.org/W7118175102","doi":"https://doi.org/10.1109/access.2025.3650618","title":"Investigating the Impact of Combined Spectral and Prosodic Features on Speech Emotion Recognition","display_name":"Investigating the Impact of Combined Spectral and Prosodic Features on Speech Emotion Recognition","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7118175102","doi":"https://doi.org/10.1109/access.2025.3650618"},"language":null,"primary_location":{"id":"doi:10.1109/access.2025.3650618","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3650618","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3650618","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121941038","display_name":"Faten S. Alamri","orcid":null},"institutions":[{"id":"https://openalex.org/I106778892","display_name":"Princess Nourah bint Abdulrahman University","ror":"https://ror.org/05b0cyh02","country_code":"SA","type":"education","lineage":["https://openalex.org/I106778892"]}],"countries":["SA"],"is_corresponding":true,"raw_author_name":"Faten S. Alamri","raw_affiliation_strings":["Department of Mathematical Sciences, College of Science, Princess Nourah bint Abdulrahman University, P.O. Box, 84428, Riyadh, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"Department of Mathematical Sciences, College of Science, Princess Nourah bint Abdulrahman University, P.O. Box, 84428, Riyadh, Saudi Arabia","institution_ids":["https://openalex.org/I106778892"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067818003","display_name":"Abeer Mirdad","orcid":"https://orcid.org/0000-0001-9917-0699"},"institutions":[{"id":"https://openalex.org/I142024983","display_name":"Prince Sultan University","ror":"https://ror.org/053mqrf26","country_code":"SA","type":"education","lineage":["https://openalex.org/I142024983"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Abeer Rashad Mirdad","raw_affiliation_strings":["AIDA Laboratory, College of Computer and Information Science (CCIS), Prince Sultan University, Riyadh, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"AIDA Laboratory, College of Computer and Information Science (CCIS), Prince Sultan University, Riyadh, Saudi Arabia","institution_ids":["https://openalex.org/I142024983"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018549351","display_name":"Tanzila Saba","orcid":"https://orcid.org/0000-0003-3138-3801"},"institutions":[{"id":"https://openalex.org/I142024983","display_name":"Prince Sultan University","ror":"https://ror.org/053mqrf26","country_code":"SA","type":"education","lineage":["https://openalex.org/I142024983"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Tanzila Saba","raw_affiliation_strings":["AIDA Laboratory, College of Computer and Information Science (CCIS), Prince Sultan University, Riyadh, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"AIDA Laboratory, College of Computer and Information Science (CCIS), Prince Sultan University, Riyadh, Saudi Arabia","institution_ids":["https://openalex.org/I142024983"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110891047","display_name":"Muhammad Amjad Raza","orcid":null},"institutions":[{"id":"https://openalex.org/I4210102737","display_name":"Khwaja Fareed University of Engineering and Information Technology","ror":"https://ror.org/0161dyt30","country_code":"PK","type":"education","lineage":["https://openalex.org/I4210102737"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Muhammad Amjad Raza","raw_affiliation_strings":["Institute of Computer Science, Khwaja Fareed University of Engineering and Information Technology, Rahim Yar Khan, Pakistan"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Science, Khwaja Fareed University of Engineering and Information Technology, Rahim Yar Khan, Pakistan","institution_ids":["https://openalex.org/I4210102737"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5121978975","display_name":"Usama Siddique","orcid":null},"institutions":[{"id":"https://openalex.org/I2990669260","display_name":"Shaikh Zayed Medical College and Hospital","ror":"https://ror.org/02vhvhj11","country_code":"PK","type":"healthcare","lineage":["https://openalex.org/I2990669260"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Usama Siddique","raw_affiliation_strings":["DanZee Tech, Rahim Yar Khan, Pakistan"],"affiliations":[{"raw_affiliation_string":"DanZee Tech, Rahim Yar Khan, Pakistan","institution_ids":["https://openalex.org/I2990669260"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5121941038"],"corresponding_institution_ids":["https://openalex.org/I106778892"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02842844,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":null,"first_page":"5719","last_page":"5732"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.0015999999595806003,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.001500000013038516,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7515000104904175},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.550599992275238},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.5497999787330627},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5012000203132629},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.49059998989105225},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.474700003862381},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.3926999866962433},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.3889999985694885},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.3781000077724457}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7515000104904175},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7264000177383423},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7016000151634216},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.550599992275238},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.5497999787330627},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5497999787330627},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5012000203132629},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.49059998989105225},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.474700003862381},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.3926999866962433},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.3889999985694885},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.3781000077724457},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.375900000333786},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3698999881744385},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.36899998784065247},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.3675000071525574},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35420000553131104},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.34369999170303345},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.3325999975204468},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.3294999897480011},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.32919999957084656},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.3172000050544739},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.3003000020980835},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C69738355","wikidata":"https://www.wikidata.org/wiki/Q1228929","display_name":"Linear discriminant analysis","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C2988148770","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion detection","level":3,"score":0.27309998869895935},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2720000147819519},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2678000032901764},{"id":"https://openalex.org/C504749915","wikidata":"https://www.wikidata.org/wiki/Q9010971","display_name":"Speech technology","level":3,"score":0.2646999955177307},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.2583000063896179}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/access.2025.3650618","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3650618","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3650618","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3650618","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7679954767227173,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2019312772","https://openalex.org/W2064641533","https://openalex.org/W2102998034","https://openalex.org/W2784128585","https://openalex.org/W3160344064","https://openalex.org/W4200149041","https://openalex.org/W4382399592","https://openalex.org/W4386068662","https://openalex.org/W4389733467","https://openalex.org/W4390507232","https://openalex.org/W4393035538","https://openalex.org/W4402316237","https://openalex.org/W4404201390","https://openalex.org/W4404421986","https://openalex.org/W4404521521","https://openalex.org/W4407157560","https://openalex.org/W4408359037","https://openalex.org/W4408791323","https://openalex.org/W4411290390","https://openalex.org/W4412375550","https://openalex.org/W4416194978","https://openalex.org/W4416195004"],"related_works":[],"abstract_inverted_index":{"Emotions":[0],"play":[1],"a":[2,15,72],"fundamental":[3],"role":[4],"in":[5,18],"human":[6],"cognition,":[7],"behavior,":[8],"and":[9,47,61,78,90,128,137,165,172],"social":[10],"interaction,":[11],"making":[12],"automatic":[13],"recognition":[14,176],"key":[16],"topic":[17],"affective":[19],"computing.":[20],"Many":[21],"existing":[22],"approaches":[23],"to":[24],"recognizing":[25,66],"emotions":[26,67],"from":[27,68],"speech":[28,69,174],"rely":[29],"heavily":[30],"on":[31,115,183],"Mel-Frequency":[32],"Cepstral":[33],"Coefficients":[34],"(MFCCs),":[35],"which":[36],"capture":[37],"short-term":[38],"spectral":[39,77],"features":[40],"but":[41],"insufficiently":[42],"represent":[43],"prosody,":[44],"long-term":[45],"dynamics,":[46],"tonal":[48],"nuances":[49],"that":[50,133,169],"are":[51],"critical":[52],"for":[53,65],"accurate":[54],"classification.":[55],"This":[56],"study":[57],"presents":[58],"an":[59,111],"interpretable":[60,173],"computationally":[62],"efficient":[63],"framework":[64],"by":[70],"employing":[71],"compact":[73],"set":[74],"of":[75,92,113,144],"fourteen":[76],"prosodic":[79],"acoustic":[80],"features,":[81],"including":[82],"pitch,":[83,136],"shimmer,":[84],"jitter,":[85],"loudness,":[86],"harmonic-to-noise":[87],"ratio":[88],"(HNR),":[89],"measures":[91],"temporal":[93],"variation.":[94],"Using":[95],"tree-based":[96],"ensemble":[97],"methods,":[98],"the":[99,107,116,125,140,151],"proposed":[100],"system":[101,155],"achieved":[102,179],"its":[103],"best":[104],"performance":[105],"with":[106,160],"XGBoost":[108],"classifier,":[109],"reaching":[110],"accuracy":[112],"96.79%":[114],"Toronto":[117],"Emotional":[118],"Speech":[119],"Set":[120],"(TESS).":[121],"Statistical":[122],"validation":[123],"using":[124],"Kruskal\u2013Wallis":[126],"test":[127],"effect":[129],"size":[130],"analysis":[131],"revealed":[132],"HNR,":[134],"mean":[135],"shimmer":[138],"were":[139],"most":[141],"discriminative":[142],"predictors":[143],"emotional":[145],"state,":[146],"thereby":[147],"providing":[148],"transparency":[149],"into":[150],"classification":[152],"process.":[153],"The":[154],"also":[156],"demonstrated":[157],"real-time":[158],"capability":[159],"inference":[161],"times":[162],"between":[163],"201":[164],"231":[166],"milliseconds,":[167],"confirming":[168],"accurate,":[170],"efficient,":[171],"emotion":[175],"can":[177],"be":[178],"without":[180],"relying":[181],"solely":[182],"deep":[184],"learning":[185],"models.":[186]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-01-05T00:00:00"}
