{"id":"https://openalex.org/W4388140063","doi":"https://doi.org/10.1108/dta-08-2023-0414","title":"Analyzing audiovisual data for understanding user's emotion in human\u2212computer interaction environment","display_name":"Analyzing audiovisual data for understanding user's emotion in human\u2212computer interaction environment","publication_year":2023,"publication_date":"2023-11-01","ids":{"openalex":"https://openalex.org/W4388140063","doi":"https://doi.org/10.1108/dta-08-2023-0414"},"language":"en","primary_location":{"id":"doi:10.1108/dta-08-2023-0414","is_oa":false,"landing_page_url":"https://doi.org/10.1108/dta-08-2023-0414","pdf_url":null,"source":{"id":"https://openalex.org/S4210171756","display_name":"Data Technologies and Applications","issn_l":"2514-9288","issn":["2514-9288","2514-9318"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319811","host_organization_name":"Emerald Publishing Limited","host_organization_lineage":["https://openalex.org/P4310319811"],"host_organization_lineage_names":["Emerald Publishing Limited"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Technologies and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020713789","display_name":"Juan Yang","orcid":"https://orcid.org/0000-0002-2004-8613"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Juan Yang","raw_affiliation_strings":["College of Computer Science and Technology, School of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, School of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I43922553"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101435753","display_name":"Zhenkun Li","orcid":"https://orcid.org/0000-0002-1444-6017"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenkun Li","raw_affiliation_strings":["College of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I43922553"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011275854","display_name":"Xu Du","orcid":"https://orcid.org/0000-0001-9069-6109"},"institutions":[{"id":"https://openalex.org/I40963666","display_name":"Central China Normal University","ror":"https://ror.org/03x1jna21","country_code":"CN","type":"education","lineage":["https://openalex.org/I40963666"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Du","raw_affiliation_strings":["National Engineering Research Center for E-Learning, Central China Normal University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for E-Learning, Central China Normal University, Wuhan, China","institution_ids":["https://openalex.org/I40963666"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5020713789"],"corresponding_institution_ids":["https://openalex.org/I43922553"],"apc_list":null,"apc_paid":null,"fwci":0.6113,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.66954617,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":"58","issue":"2","first_page":"318","last_page":"343"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12032","display_name":"Multisensory perception and integration","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.7675246596336365},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7563838958740234},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6167879700660706},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.5625044107437134},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.4931895136833191},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.48141026496887207},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44208788871765137},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.4110730290412903},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4027097821235657}],"concepts":[{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.7675246596336365},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7563838958740234},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6167879700660706},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.5625044107437134},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.4931895136833191},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.48141026496887207},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44208788871765137},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.4110730290412903},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4027097821235657},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1108/dta-08-2023-0414","is_oa":false,"landing_page_url":"https://doi.org/10.1108/dta-08-2023-0414","pdf_url":null,"source":{"id":"https://openalex.org/S4210171756","display_name":"Data Technologies and Applications","issn_l":"2514-9288","issn":["2514-9288","2514-9318"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319811","host_organization_name":"Emerald Publishing Limited","host_organization_lineage":["https://openalex.org/P4310319811"],"host_organization_lineage_names":["Emerald Publishing Limited"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Technologies and Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7300000190734863,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W1651753422","https://openalex.org/W1750953599","https://openalex.org/W1780253070","https://openalex.org/W1969483602","https://openalex.org/W1987366351","https://openalex.org/W1994518960","https://openalex.org/W2036309320","https://openalex.org/W2044073059","https://openalex.org/W2044372538","https://openalex.org/W2094998392","https://openalex.org/W2095705004","https://openalex.org/W2106390385","https://openalex.org/W2108883127","https://openalex.org/W2133564696","https://openalex.org/W2135511277","https://openalex.org/W2148154194","https://openalex.org/W2150337255","https://openalex.org/W2155214670","https://openalex.org/W2162418306","https://openalex.org/W2194775991","https://openalex.org/W2314395941","https://openalex.org/W2341528187","https://openalex.org/W2344225493","https://openalex.org/W2402341335","https://openalex.org/W2470413457","https://openalex.org/W2559909572","https://openalex.org/W2592183475","https://openalex.org/W2610961739","https://openalex.org/W2613890029","https://openalex.org/W2619383789","https://openalex.org/W2701865535","https://openalex.org/W2738581557","https://openalex.org/W2803193013","https://openalex.org/W2883409523","https://openalex.org/W2891359673","https://openalex.org/W2896323182","https://openalex.org/W2908469318","https://openalex.org/W2958722525","https://openalex.org/W2962706528","https://openalex.org/W2962916094","https://openalex.org/W2989763126","https://openalex.org/W2990276885","https://openalex.org/W2996799978","https://openalex.org/W3023281269","https://openalex.org/W3090471441","https://openalex.org/W3094378983","https://openalex.org/W3094524767","https://openalex.org/W3101998545","https://openalex.org/W3111291969","https://openalex.org/W3112666470","https://openalex.org/W3112864462","https://openalex.org/W3116238789","https://openalex.org/W3118882785","https://openalex.org/W3123002293","https://openalex.org/W3136750845","https://openalex.org/W3137028092","https://openalex.org/W3146444769","https://openalex.org/W3172353912","https://openalex.org/W3175546442","https://openalex.org/W3183580551","https://openalex.org/W3186192207","https://openalex.org/W3209494353","https://openalex.org/W4205555939","https://openalex.org/W4206326349","https://openalex.org/W4210611093","https://openalex.org/W4220829848","https://openalex.org/W4280542149","https://openalex.org/W4281786928","https://openalex.org/W4286370724","https://openalex.org/W4287219194","https://openalex.org/W4290716630","https://openalex.org/W4296564736","https://openalex.org/W4300772595","https://openalex.org/W4312758889","https://openalex.org/W4320920903"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4224266612","https://openalex.org/W2383394264","https://openalex.org/W4320153225","https://openalex.org/W4293261942","https://openalex.org/W3125968744","https://openalex.org/W2004831463","https://openalex.org/W2167701463","https://openalex.org/W2110287964","https://openalex.org/W2168054807"],"abstract_inverted_index":{"Purpose":[0],"Although":[1],"numerous":[2],"signal":[3],"modalities":[4,13,89,229],"are":[5,14,169],"available":[6],"for":[7,21,45,105,148,179,216,235],"emotion":[8,40,63,107,218,237],"recognition,":[9],"audio":[10],"and":[11,18,37,48,75,79,118,124,163,173,176,184,199,204,224,261,264,285],"visual":[12],"the":[15,59,129,136,149,202,222,247,281],"most":[16],"common":[17],"predominant":[19],"forms":[20],"human":[22],"beings":[23],"to":[24,34,67,82,90,111,120,143,171,213,271],"express":[25],"their":[26],"emotional":[27,233],"states":[28],"in":[29,58],"daily":[30],"communication.":[31],"Therefore,":[32],"how":[33,66,81],"achieve":[35],"automatic":[36],"accurate":[38],"audiovisual":[39,62,106,122,217,267],"recognition":[41],"is":[42,103,141,211],"significantly":[43],"important":[44],"developing":[46],"engaging":[47,284],"empathetic":[49,286],"human\u2013computer":[50,287],"interaction":[51,117,288],"environment.":[52,289],"However,":[53],"two":[54,88,194],"major":[55],"challenges":[56],"exist":[57],"field":[60],"of":[61,71,132,151,206,227,283],"recognition:":[64],"(1)":[65,209],"effectively":[68],"capture":[69,174],"representations":[70,123],"each":[72],"single":[73],"modality":[74],"eliminate":[76],"redundant":[77,126],"features":[78],"(2)":[80,220],"efficiently":[83],"integrate":[84,112],"information":[85,226],"from":[86,146],"these":[87],"generate":[91],"discriminative":[92],"representations.":[93,189],"Design/methodology/approach":[94],"A":[95],"novel":[96],"key-frame":[97,113,242],"extraction-based":[98],"attention":[99],"fusion":[100,119,268],"network":[101],"(KE-AFN)":[102],"proposed":[104,170,241,277],"recognition.":[108,219,238],"KE-AFN":[109,210,278],"attempts":[110],"extraction":[114,243],"with":[115],"multimodal":[116,188],"enhance":[121,246],"reduce":[125],"computation,":[127],"filling":[128],"research":[130],"gaps":[131],"existing":[133],"approaches.":[134],"Specifically,":[135,208],"local":[137],"maximum\u2013based":[138],"content":[139],"analysis":[140],"designed":[142],"extract":[144],"key-frames":[145],"videos":[147],"purpose":[150],"eliminating":[152],"data":[153,182],"redundancy.":[154],"Two":[155],"modules,":[156],"including":[157],"\u201cMulti-head":[158,164],"Attention-based":[159,165],"Intra-modality":[160],"Interaction":[161,167],"Module\u201d":[162],"Cross-modality":[166],"Module\u201d,":[168],"mine":[172],"intra-":[175,260],"cross-modality":[177,262],"interactions":[178,263],"further":[180],"reducing":[181],"redundancy":[183],"producing":[185],"more":[186,232,250],"powerful":[187],"Findings":[190],"Extensive":[191],"experiments":[192],"on":[193,255],"benchmark":[195],"datasets":[196],"(i.e.":[197],"RAVDESS":[198],"CMU-MOSEI)":[200],"demonstrate":[201],"effectiveness":[203],"rationality":[205],"KE-AFN.":[207],"superior":[212],"state-of-the-art":[214],"baselines":[215],"Exploring":[221],"supplementary":[223],"complementary":[225],"different":[228],"can":[230,245,269,279],"provide":[231],"clues":[234],"better":[236,272],"(3)":[239],"The":[240,276],"strategy":[244],"performance":[248],"by":[249],"than":[251],"2.79":[252],"per":[253],"cent":[254],"accuracy.":[256],"(4)":[257],"Both":[258],"exploring":[259],"employing":[265],"attention-based":[266],"lead":[270],"prediction":[273],"performance.":[274],"Originality/value":[275],"support":[280],"development":[282]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
