{"id":"https://openalex.org/W283543405","doi":"https://doi.org/10.21437/eurospeech.2001-627","title":"Speech emotion recognition using hidden Markov models","display_name":"Speech emotion recognition using hidden Markov models","publication_year":2001,"publication_date":"2001-09-03","ids":{"openalex":"https://openalex.org/W283543405","doi":"https://doi.org/10.21437/eurospeech.2001-627","mag":"283543405"},"language":"en","primary_location":{"id":"doi:10.21437/eurospeech.2001-627","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2001-627","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"7th European Conference on Speech Communication and Technology (Eurospeech 2001)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030036564","display_name":"Albino Nogueiras Rodr\u00edguez","orcid":"https://orcid.org/0000-0002-3159-1718"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Albino Nogueiras","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103681962","display_name":"Asunci\u00f3n Moreno","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Asunci\u00f3n Moreno","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000405202","display_name":"Antonio Bonafonte","orcid":"https://orcid.org/0000-0002-6240-9915"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Antonio Bonafonte","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5063420793","display_name":"Jos\u00e9 Bernardo Mari\u00f1o Acebal","orcid":"https://orcid.org/0000-0002-9471-8675"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jos\u00e9 B. Mari\u00f1o","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5030036564"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.9406,"has_fulltext":false,"cited_by_count":231,"citation_normalized_percentile":{"value":0.9330855,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"2679","last_page":"2682"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.7995374202728271},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7807142734527588},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7049557566642761},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5479006767272949},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.5131109952926636},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.5067523121833801},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.4996960163116455},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.40244418382644653},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3876086175441742}],"concepts":[{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.7995374202728271},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7807142734527588},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7049557566642761},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5479006767272949},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.5131109952926636},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.5067523121833801},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.4996960163116455},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.40244418382644653},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3876086175441742},{"id":"https://openalex.org/C157915830","wikidata":"https://www.wikidata.org/wiki/Q2928001","display_name":"Bubble","level":2,"score":0.0},{"id":"https://openalex.org/C129307140","wikidata":"https://www.wikidata.org/wiki/Q6795880","display_name":"Maximum bubble pressure method","level":3,"score":0.0},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/eurospeech.2001-627","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2001-627","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"7th European Conference on Speech Communication and Technology (Eurospeech 2001)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W94037376","https://openalex.org/W1870886715","https://openalex.org/W1940107713","https://openalex.org/W2032254851"],"related_works":["https://openalex.org/W2053269318","https://openalex.org/W4241523039","https://openalex.org/W2364370872","https://openalex.org/W1992908141","https://openalex.org/W3006475563","https://openalex.org/W3015707499","https://openalex.org/W2049462786","https://openalex.org/W4287868249","https://openalex.org/W2326728821","https://openalex.org/W4297798768"],"abstract_inverted_index":{"This":[0,90,186],"paper":[1,187,337],"introduces":[2],"a":[3,177,292,321],"first":[4,192],"approach":[5,17,193],"to":[6,95,151,169,172,194,234,251],"emotion":[7,52,112,142,195,275,297,328,343],"recognition":[8,14,23,42,53,130,276,329,341],"using":[9,25,54,79,348],"RAMSES,":[10],"the":[11,31,38,41,55,80,99,110,116,132,148,153,157,161,189,202,205,239,272,280,284,289,340],"UPC\u2019s":[12],"speech":[13,22,120,129,162,303],"system.":[15],"The":[16,64,197,209,247],"is":[18,92,113,150,176,199,217,249],"based":[19,259],"on":[20,49,260],"standard":[21,349],"technology":[24],"hidden":[26,350],"semi-continuous":[27],"Markov":[28,351],"models.":[29],"Both":[30],"selection":[32],"of":[33,40,58,83,115,134,138,156,160,179,204,211,241,274,278,283,291,342],"low":[34,84],"level":[35,85],"features":[36,86],"and":[37,87,141,175,222,230,244,268,310],"design":[39],"system":[43],"are":[44,47,312,317],"addressed.":[45],"Results":[46],"given":[48],"speaker":[50,158,295],"dependent":[51,333],"Spanish":[56,346],"corpus":[57],"INTERFACE":[59,206,285],"Emotional":[60],"Speech":[61],"Synthesis":[62],"Database.":[63],"accuracy":[65],"recognising":[66],"seven":[67],"different":[68,123],"emotions\u2014the":[69],"six":[70],"ones":[71],"defined":[72],"in":[73,102,119,131,201,232,330],"MPEG-4":[74],"plus":[75],"neutral":[76],"style\u2014exceeds":[77],"80%":[78],"best":[81],"combination":[82],"HMM":[88],"structure.":[89],"result":[91],"very":[93],"similar":[94],"that":[96],"obtained":[97],"with":[98,109,305,339],"same":[100],"database":[101],"subjective":[103],"evaluation":[104],"by":[105,264],"human":[106,262],"judges.":[107],"Dealing":[108],"speaker\u2019s":[111],"one":[114],"latest":[117],"challenges":[118],"technologies.":[121],"Three":[122],"aspects":[124],"can":[125],"be":[126,288,325],"easily":[127],"identified:":[128],"presence":[133],"emotional":[135,139,154],"speech,":[136,140,265,279],"synthesis":[137,229],"recognition.":[143,196],"In":[144,271],"this":[145,212,300,336],"last":[146],"case,":[147],"objective":[149,210],"determine":[152],"state":[155],"out":[159,277],"samples.":[163],"Possible":[164],"applications":[165],"include":[166],"from":[167,307],"help":[168],"psychiatric":[170],"diagnosis":[171],"intelligent":[173],"toys,":[174],"subject":[178],"recent":[180],"but":[181],"rapidly":[182],"growing":[183],"interest":[184],"[1].":[185],"describes":[188],"TALP":[190],"researchers":[191],"work":[198,248],"inserted":[200],"scope":[203],"project":[207,216,286],"[2].":[208],"European":[213],"Commission":[214],"sponsored":[215],"\u201cto":[218],"define":[219],"new":[220],"models":[221,352],"implement":[223],"advanced":[224],"tools":[225],"for":[226,238,344],"audio-video":[227],"analysis,":[228],"representation":[231],"order":[233],"provide":[235],"essential":[236],"technologies":[237],"implementation":[240],"large-scale":[242],"virtual":[243],"augmented":[245],"environments.":[246],"oriented":[250],"make":[252],"man-machine":[253],"interaction":[254],"as":[255,257],"natural":[256],"possible,":[258],"everyday":[261],"communication":[263],"facial":[266],"expressions":[267],"body":[269],"gestures.\u201d":[270],"field":[273],"main":[281],"goal":[282],"will":[287,324],"construction":[290],"real-time":[293],"multi-lingual":[294],"independent":[296],"recogniser.":[298],"For":[299],"purpose,":[301],"large":[302],"databases":[304],"recordings":[306],"many":[308],"speakers":[309,347],"languages":[311],"needed.":[313],"As":[314],"these":[315],"resources":[316],"not":[318],"available":[319],"yet,":[320],"reduced":[322],"problem":[323],"addressed":[326],"first:":[327],"multi-speaker":[331],"language":[332],"conditions.":[334],"Namely,":[335],"deals":[338],"two":[345],"technology.":[353]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":16},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":14},{"year":2020,"cited_by_count":12},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":13},{"year":2017,"cited_by_count":9},{"year":2016,"cited_by_count":9},{"year":2015,"cited_by_count":12},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":11},{"year":2012,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
