{"id":"https://openalex.org/W2102426695","doi":"https://doi.org/10.1186/1687-6180-2012-15","title":"Emotion and mental state recognition from speech","display_name":"Emotion and mental state recognition from speech","publication_year":2012,"publication_date":"2012-01-19","ids":{"openalex":"https://openalex.org/W2102426695","doi":"https://doi.org/10.1186/1687-6180-2012-15","mag":"2102426695"},"language":"en","primary_location":{"id":"doi:10.1186/1687-6180-2012-15","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1687-6180-2012-15","pdf_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-6180-2012-15","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-6180-2012-15","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030922449","display_name":"Julien Epps","orcid":"https://orcid.org/0000-0001-6624-5551"},"institutions":[{"id":"https://openalex.org/I42894916","display_name":"Data61","ror":"https://ror.org/03q397159","country_code":"AU","type":"other","lineage":["https://openalex.org/I1292875679","https://openalex.org/I2801453606","https://openalex.org/I42894916","https://openalex.org/I4387156119"]},{"id":"https://openalex.org/I31746571","display_name":"UNSW Sydney","ror":"https://ror.org/03r8z3t63","country_code":"AU","type":"education","lineage":["https://openalex.org/I31746571"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Julien Epps","raw_affiliation_strings":["ATP Research Laboratory, National ICT Australia (NICTA), Eveleigh, NSW, 2015, Australia","School of Electrical Engineering and Telecommunications, The University of New South Wales, Sydney, NSW, 2052, Australia","School of Electrical Engineering and Telecommunications, The University of New South Wales, Sydney, Australia","ATP Research Laboratory, National ICT Australia (NICTA), Eveleigh, Australia"],"affiliations":[{"raw_affiliation_string":"ATP Research Laboratory, National ICT Australia (NICTA), Eveleigh, NSW, 2015, Australia","institution_ids":["https://openalex.org/I42894916"]},{"raw_affiliation_string":"School of Electrical Engineering and Telecommunications, The University of New South Wales, Sydney, NSW, 2052, Australia","institution_ids":["https://openalex.org/I31746571"]},{"raw_affiliation_string":"School of Electrical Engineering and Telecommunications, The University of New South Wales, Sydney, Australia","institution_ids":["https://openalex.org/I31746571"]},{"raw_affiliation_string":"ATP Research Laboratory, National ICT Australia (NICTA), Eveleigh, Australia","institution_ids":["https://openalex.org/I42894916"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027895237","display_name":"Roddy Cowie","orcid":"https://orcid.org/0000-0003-3480-2223"},"institutions":[{"id":"https://openalex.org/I126231945","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62","country_code":"GB","type":"education","lineage":["https://openalex.org/I126231945"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Roddy Cowie","raw_affiliation_strings":["Queen's University, Belfast, BT7 1NN, Northern Ireland","Queen's University, Belfast,   Northern  Ireland"],"affiliations":[{"raw_affiliation_string":"Queen's University, Belfast, BT7 1NN, Northern Ireland","institution_ids":[]},{"raw_affiliation_string":"Queen's University, Belfast,   Northern  Ireland","institution_ids":["https://openalex.org/I126231945"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010028928","display_name":"Shrikanth Narayanan","orcid":"https://orcid.org/0000-0002-1052-6204"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shrikanth Narayanan","raw_affiliation_strings":["Department of Electrical Engineering, Viterbi School of Engineering, University of Southern California, Los Angeles, CA, 90089, USA","Department of Electrical Engineering, Viterbi School of Engineering, University of Southern California, Los Angeles, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Viterbi School of Engineering, University of Southern California, Los Angeles, CA, 90089, USA","institution_ids":["https://openalex.org/I1174212"]},{"raw_affiliation_string":"Department of Electrical Engineering, Viterbi School of Engineering, University of Southern California, Los Angeles, USA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043060302","display_name":"Bj\u00f6rn W. Schuller","orcid":"https://orcid.org/0000-0002-6478-8699"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Bj\u00f6rn Schuller","raw_affiliation_strings":["Institute for Human-Machine Communication, Technische Universit\u00e4t M\u00fcnchen, 80290, M\u00fcnchen, Germany","[Institute for Human Machine Communication, Technische Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany]"],"affiliations":[{"raw_affiliation_string":"Institute for Human-Machine Communication, Technische Universit\u00e4t M\u00fcnchen, 80290, M\u00fcnchen, Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"[Institute for Human Machine Communication, Technische Universit\u00e4t M\u00fcnchen, M\u00fcnchen, Germany]","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112613657","display_name":"Jianhua Tao","orcid":"https://orcid.org/0000-0002-9344-6428"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhua Tao","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, 100080, China","National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, 100080, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":5,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5030922449"],"corresponding_institution_ids":["https://openalex.org/I31746571","https://openalex.org/I42894916"],"apc_list":{"value":1140,"currency":"GBP","value_usd":1398},"apc_paid":{"value":1140,"currency":"GBP","value_usd":1398},"fwci":0.8918,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.80450091,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"2012","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.932200014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.932200014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/paralanguage","display_name":"Paralanguage","score":0.79230797290802},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.5344611406326294},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5016896724700928},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4933835566043854},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4252024292945862},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.4121687412261963},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.3961297571659088},{"id":"https://openalex.org/keywords/communication","display_name":"Communication","score":0.15024089813232422}],"concepts":[{"id":"https://openalex.org/C133378560","wikidata":"https://www.wikidata.org/wiki/Q1753225","display_name":"Paralanguage","level":2,"score":0.79230797290802},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.5344611406326294},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5016896724700928},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4933835566043854},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4252024292945862},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4121687412261963},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3961297571659088},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.15024089813232422}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/1687-6180-2012-15","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1687-6180-2012-15","pdf_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-6180-2012-15","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},{"id":"pmh:oai:uni-augsburg.opus-bayern.de:72642","is_oa":true,"landing_page_url":"https://opus.bibliothek.uni-augsburg.de/opus4/frontdoor/index/index/docId/72642","pdf_url":null,"source":{"id":"https://openalex.org/S4306400930","display_name":"OPUS (Augsburg University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I119916105","host_organization_name":"Augsburg University","host_organization_lineage":["https://openalex.org/I119916105"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/1687-6180-2012-15","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1687-6180-2012-15","pdf_url":"https://asp-eurasipjournals.springeropen.com/counter/pdf/10.1186/1687-6180-2012-15","source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7699999809265137}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2102426695.pdf","grobid_xml":"https://content.openalex.org/works/W2102426695.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4297807400","https://openalex.org/W1491159402","https://openalex.org/W4313854686","https://openalex.org/W321304764","https://openalex.org/W2249138175","https://openalex.org/W2611678594","https://openalex.org/W3162054169","https://openalex.org/W1813780412","https://openalex.org/W2640905660","https://openalex.org/W2122924390"],"abstract_inverted_index":{"As":[0],"research":[1,119,206,263],"in":[2,23,48,54,80,130,189,260,267,297,329,353,385,437,463,518,578],"speech":[3,16,20,90,100,132,183,191,284,412,424,430,495],"processing":[4,21,72,221,299],"has":[5,8,264],"matured,":[6],"attention":[7],"gradually":[9],"shifted":[10],"from":[11,89,98,349,392,480,493],"linguistic-related":[12],"applications":[13,266,311],"such":[14,252],"as":[15,216,253],"recognition":[17,26,75,262,314,322,523],"towards":[18],"paralinguistic":[19],"problems,":[22],"particular":[24],"the":[25,51,117,131,147,170,173,178,186,190,226,360,419,452,464,481,485,494,507,566,569],"of":[27,36,50,70,84,116,127,176,180,214,228,233,295,312,323,374,382,389,398,411,423,445,454,509,543,550,560,568],"speaker":[28,154,538],"identity,":[29],"language,":[30],"emotion,":[31,177,241],"gender,":[32],"and":[33,61,73,86,110,155,159,164,185,248,272,282,304,321,326,338,368,401,432,439,449,498,520,527,546],"age.":[34],"Determination":[35],"a":[37,44,68,92,211,217,293,371,455,490,530],"speaker\u2019s":[38],"emotion":[39,85,181,195,215,261,328,477,519],"or":[40],"mental":[41,87,218,234,319,521,531],"state":[42,88,235,522,532],"is":[43,91,207,563],"particularly":[45],"challenging":[46],"problem,":[47,379],"view":[49,213],"significant":[52],"variability":[53,151],"its":[55],"expression":[56],"posed":[57],"by":[58,343],"linguistic,":[59],"contextual,":[60],"speaker-specific":[62],"characteristics":[63,239],"within":[64],"speech.":[65,330,386],"In":[66],"response,":[67],"range":[69,294],"signal":[71,111,192,220,298],"pattern":[74,313],"methods":[76,144,300,316],"have":[77,196,223],"been":[78],"developed":[79],"recent":[81,258],"years.":[82],"Recognition":[83],"fundamentally":[93],"multidisciplinary":[94],"field,":[95],"comprising":[96,362],"contributions":[97],"psychology,":[99],"science,":[101],"linguistics,":[102],"(cooccurring)":[103],"nonverbal":[104],"communication,":[105],"machine":[106,142],"learning,":[107],"artificial":[108],"intelligence":[109],"processing,":[112],"among":[113],"others.":[114],"Some":[115],"key":[118],"problems":[120],"addressed":[121],"to":[122,146,153,194,198,376,409,442],"date":[123],"include":[124],"isolating":[125],"sources":[126],"emotion-specific":[128],"information":[129,562],"signal,":[133],"extracting":[134,472],"suitable":[135,166],"features,":[136],"forming":[137],"reduced-dimension":[138],"feature":[139,150,306],"sets,":[140],"developing":[141],"learning":[143],"applicable":[145],"task,":[148],"reducing":[149],"due":[152,193],"linguistic":[156],"content,":[157],"comparing":[158],"evaluating":[160],"diverse":[161],"methods,":[162],"robustness,":[163],"constructing":[165],"databases.":[167],"Studies":[168],"examining":[169],"relationships":[171],"between":[172],"psychological":[174],"basis":[175],"effect":[179],"on":[182,201,489,576],"production,":[184],"measurable":[187],"differences":[188],"helped":[197],"shed":[199],"light":[200],"these":[202],"problems;":[203],"however,":[204],"substantial":[205],"still":[208],"required.":[209],"Taking":[210],"broader":[212],"state,":[219],"researchers":[222],"also":[224,504],"explored":[225],"possibilities":[227],"automatically":[229],"detecting":[230,318,380],"other":[231],"types":[232,434],"which":[236],"share":[237],"some":[238],"with":[240],"for":[242,301,317,471,516],"example":[243],"stress,":[244],"depression,":[245,438],"cognitive":[246],"load,":[247],"\u2018cognitive":[249],"epistemic\u2019":[250],"states":[251,320],"interest,":[254],"scepticism,":[255],"etc.":[256],"The":[257,548],"interest":[259],"seen":[265],"call":[268],"centre":[269],"analytics,":[270],"human-machine":[271],"humanrobot":[273],"interfaces,":[274],"multimedia":[275],"retrieval,":[276],"surveillance":[277],"tasks,":[278],"behavioural":[279],"health":[280],"informatics,":[281],"improved":[283],"recognition.":[285,478],"This":[286],"special":[287,364],"issue":[288],"comprises":[289],"nine":[290],"articles":[291,332,361],"covering":[292],"topics":[296],"vocal":[302],"source":[303],"acoustic":[305],"extraction,":[307],"robustness":[308],"issues,":[309],"novel":[310],"techniques,":[315],"non-prototypical":[324],"spontaneous":[325],"naturalistic":[327],"These":[331,406],"were":[333],"accepted":[334],"following":[335],"peer":[336],"review,":[337],"each":[339],"submission":[340],"was":[341,347],"handled":[342],"an":[344,377],"editor":[345],"who":[346],"independent":[348],"all":[350],"authors":[351,486],"listed":[352],"that":[354,414,428,461,535],"manuscript.":[355],"Herein,":[356],"we":[357],"briefly":[358],"introduce":[359],"this":[363],"issue.":[365],"Trevino,":[366],"Quatieri":[367],"Malyska":[369],"bring":[370],"new":[372],"level":[373],"sophistication":[375],"old":[378],"signs":[381],"depressive":[383],"disorders":[384],"Their":[387,502],"measures":[388,410,422],"depression":[390],"come":[391],"standard":[393],"psychiatric":[394],"instruments,":[395],"Quick":[396],"Inventory":[397],"Depressive":[399],"Symptomatology":[400],"Hamilton":[402],"Depression":[403],"rating":[404],"scales.":[405],"are":[407,415],"linked":[408],"timing":[413],"much":[416],"richer":[417],"than":[418,460],"traditional":[420],"global":[421],"rate.":[425],"Results":[426],"indicate":[427],"different":[429,443],"sounds":[431],"sound":[433],"behave":[435],"differently":[436],"may":[440],"relate":[441],"aspects":[444],"depression.":[446],"Caponetti,":[447],"Buscicchio":[448],"Castellano":[450],"propose":[451,529],"use":[453],"more":[456],"detailed":[457,473],"auditory":[458],"model":[459],"embodied":[462],"widely":[465],"employed":[466],"mel":[467],"frequency":[468],"cepstral":[469],"coefficients,":[470],"spectral":[474],"features":[475],"during":[476],"Working":[479],"Lyon":[482],"cochlear":[483],"model,":[484],"demonstrate":[487],"improvements":[488],"five-class":[491],"problem":[492],"under":[496],"simulated":[497],"actual":[499],"stress":[500],"database.":[501],"study":[503],"further":[505],"validates":[506],"applicability":[508],"long":[510],"short-term":[511],"memory":[512],"recurrent":[513],"neural":[514],"networks":[515],"classification":[517],"problems.":[524],"Callejas,":[525],"Griol":[526],"Lopez-Cozar":[528],"prediction":[533],"approach":[534],"considers":[536],"both":[537],"*":[539],"Correspondence:":[540],"j.epps@unsw.edu.au":[541],"School":[542],"Electrical":[544],"Engineering":[545],"Telecommunications,":[547],"University":[549],"New":[551],"South":[552],"Wales,":[553],"Sydney,":[554],"NSW":[555],"2052,":[556],"Australia":[557],"Full":[558],"list":[559],"author":[561],"available":[564],"at":[565],"end":[567],"article":[570],"Epps":[571],"et":[572],"al.":[573],"EURASIP":[574],"Journal":[575],"Advances":[577],"Signal":[579],"Processing":[580],"2012,":[581],"2012:15":[582],"http://asp.eurasipjournals.com/content/2012/1/15":[583]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
