{"id":"https://openalex.org/W3209798173","doi":"https://doi.org/10.1109/taffc.2021.3122146","title":"Facial Expression Recognition With Visual Transformers and Attentional Selective Fusion","display_name":"Facial Expression Recognition With Visual Transformers and Attentional Selective Fusion","publication_year":2021,"publication_date":"2021-10-26","ids":{"openalex":"https://openalex.org/W3209798173","doi":"https://doi.org/10.1109/taffc.2021.3122146","mag":"3209798173"},"language":"en","primary_location":{"id":"doi:10.1109/taffc.2021.3122146","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taffc.2021.3122146","pdf_url":null,"source":{"id":"https://openalex.org/S104780363","display_name":"IEEE Transactions on Affective Computing","issn_l":"1949-3045","issn":["1949-3045","2371-9850"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Affective Computing","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2103.16854","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090221825","display_name":"Fuyan Ma","orcid":"https://orcid.org/0000-0003-0483-8866"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fuyan Ma","raw_affiliation_strings":["College of Electrical and Information Engineering, Changsha, China","Key Laboratory of Visual Perception and Artificial Intelligence of Hunan Province, Hunan University, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0003-0483-8866","affiliations":[{"raw_affiliation_string":"College of Electrical and Information Engineering, Changsha, China","institution_ids":[]},{"raw_affiliation_string":"Key Laboratory of Visual Perception and Artificial Intelligence of Hunan Province, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100641761","display_name":"Bin Sun","orcid":"https://orcid.org/0000-0002-7029-8784"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Sun","raw_affiliation_strings":["College of Electrical and Information Engineering, Changsha, China","Key Laboratory of Visual Perception and Artificial Intelligence of Hunan Province, Hunan University, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0002-7029-8784","affiliations":[{"raw_affiliation_string":"College of Electrical and Information Engineering, Changsha, China","institution_ids":[]},{"raw_affiliation_string":"Key Laboratory of Visual Perception and Artificial Intelligence of Hunan Province, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067097659","display_name":"Shutao Li","orcid":"https://orcid.org/0000-0002-0585-9848"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shutao Li","raw_affiliation_strings":["College of Electrical and Information Engineering, Changsha, China","Key Laboratory of Visual Perception and Artificial Intelligence of Hunan Province, Hunan University, Changsha, China","State Key Laboratory of Advanced Design and Manufacturing for Vehicle Body, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0002-0585-9848","affiliations":[{"raw_affiliation_string":"College of Electrical and Information Engineering, Changsha, China","institution_ids":[]},{"raw_affiliation_string":"Key Laboratory of Visual Perception and Artificial Intelligence of Hunan Province, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"State Key Laboratory of Advanced Design and Manufacturing for Vehicle Body, Changsha, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5090221825"],"corresponding_institution_ids":["https://openalex.org/I16609230"],"apc_list":null,"apc_paid":null,"fwci":31.4648,"has_fulltext":false,"cited_by_count":280,"citation_normalized_percentile":{"value":0.99853271,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"14","issue":"2","first_page":"1236","last_page":"1248"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7493268251419067},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7062506079673767},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6395127177238464},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5784709453582764},{"id":"https://openalex.org/keywords/facial-expression","display_name":"Facial expression","score":0.563066840171814},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4878992736339569},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.44405877590179443},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4374341368675232},{"id":"https://openalex.org/keywords/facial-expression-recognition","display_name":"Facial expression recognition","score":0.4338092803955078},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4209522008895874},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.36835578083992004},{"id":"https://openalex.org/keywords/facial-recognition-system","display_name":"Facial recognition system","score":0.29794788360595703},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10150814056396484}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7493268251419067},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7062506079673767},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6395127177238464},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5784709453582764},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.563066840171814},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4878992736339569},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.44405877590179443},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4374341368675232},{"id":"https://openalex.org/C2987714656","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Facial expression recognition","level":4,"score":0.4338092803955078},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4209522008895874},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.36835578083992004},{"id":"https://openalex.org/C31510193","wikidata":"https://www.wikidata.org/wiki/Q1192553","display_name":"Facial recognition system","level":3,"score":0.29794788360595703},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10150814056396484},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taffc.2021.3122146","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taffc.2021.3122146","pdf_url":null,"source":{"id":"https://openalex.org/S104780363","display_name":"IEEE Transactions on Affective Computing","issn_l":"1949-3045","issn":["1949-3045","2371-9850"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Affective Computing","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2103.16854","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.16854","pdf_url":"https://arxiv.org/pdf/2103.16854","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2103.16854","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.16854","pdf_url":"https://arxiv.org/pdf/2103.16854","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.6700000166893005,"display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G7579875074","display_name":null,"funder_award_id":"62171183","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1546411676","https://openalex.org/W1986803802","https://openalex.org/W1990207480","https://openalex.org/W2014185685","https://openalex.org/W2035372623","https://openalex.org/W2038317184","https://openalex.org/W2060488580","https://openalex.org/W2093422693","https://openalex.org/W2101176070","https://openalex.org/W2103943262","https://openalex.org/W2106390385","https://openalex.org/W2108113956","https://openalex.org/W2108598243","https://openalex.org/W2147800946","https://openalex.org/W2161969291","https://openalex.org/W2194775991","https://openalex.org/W2341528187","https://openalex.org/W2479639417","https://openalex.org/W2481681431","https://openalex.org/W2513140567","https://openalex.org/W2540801879","https://openalex.org/W2563705555","https://openalex.org/W2565639579","https://openalex.org/W2745497104","https://openalex.org/W2787524669","https://openalex.org/W2798553619","https://openalex.org/W2799041689","https://openalex.org/W2805613995","https://openalex.org/W2806927661","https://openalex.org/W2889978276","https://openalex.org/W2894217452","https://openalex.org/W2896277673","https://openalex.org/W2902598059","https://openalex.org/W2904483377","https://openalex.org/W2944523338","https://openalex.org/W2948217907","https://openalex.org/W2963446712","https://openalex.org/W3003720578","https://openalex.org/W3006012949","https://openalex.org/W3019410392","https://openalex.org/W3035336958","https://openalex.org/W3035565904","https://openalex.org/W3088827635","https://openalex.org/W3089911443","https://openalex.org/W3091862369","https://openalex.org/W3094502228","https://openalex.org/W3101998545","https://openalex.org/W3106547440","https://openalex.org/W3109635183","https://openalex.org/W3112113890","https://openalex.org/W3114896399","https://openalex.org/W3117707723","https://openalex.org/W3122081138","https://openalex.org/W3124054989","https://openalex.org/W3127463063","https://openalex.org/W3129458182","https://openalex.org/W3131500599","https://openalex.org/W3134941379","https://openalex.org/W3154541964","https://openalex.org/W3171516518","https://openalex.org/W3180355996","https://openalex.org/W3186105911","https://openalex.org/W3189369550","https://openalex.org/W4214493665","https://openalex.org/W4214669216","https://openalex.org/W4238539449","https://openalex.org/W4295312788","https://openalex.org/W4385245566","https://openalex.org/W4388315058","https://openalex.org/W6631190155","https://openalex.org/W6632670727","https://openalex.org/W6675224631","https://openalex.org/W6676019839","https://openalex.org/W6725923168","https://openalex.org/W6739901393","https://openalex.org/W6755106128","https://openalex.org/W6766978945","https://openalex.org/W6784333009","https://openalex.org/W6786361841","https://openalex.org/W6786690992","https://openalex.org/W6786708909","https://openalex.org/W6787283782","https://openalex.org/W6787826751","https://openalex.org/W6787906798"],"related_works":["https://openalex.org/W4205986151","https://openalex.org/W2355913164","https://openalex.org/W2162992774","https://openalex.org/W1153638794","https://openalex.org/W2168968280","https://openalex.org/W2901126000","https://openalex.org/W4323520705","https://openalex.org/W2116055069","https://openalex.org/W2356663679","https://openalex.org/W3027190010"],"abstract_inverted_index":{"Facial":[0],"Expression":[1],"Recognition":[2],"(FER)":[3],"in":[4,30,33,114,174],"the":[5,34,56,104,115,124,150,170,188,208,227,246,251],"wild":[6,116],"is":[7,80,194],"extremely":[8],"challenging":[9],"due":[10],"to":[11,84,111,180],"occlusions,":[12,47],"variant":[13,48],"head":[14,49],"poses,":[15],"face":[16],"deformation":[17],"and":[18,51,66,82,93,160,205,236],"motion":[19],"blur":[20],"under":[21],"unconstrained":[22],"conditions.":[23],"Although":[24],"substantial":[25],"progresses":[26],"have":[27],"been":[28],"made":[29],"automatic":[31],"FER":[32,59,113],"past":[35],"few":[36],"decades,":[37],"previous":[38,71],"studies":[39],"were":[40],"mainly":[41],"designed":[42],"for":[43,129],"lab-controlled":[44],"FER.":[45],"Real-world":[46],"poses":[50],"other":[52,221],"issues":[53],"definitely":[54],"increase":[55],"difficulty":[57],"of":[58,62,90,133,164,172,226,250],"on":[60,196,229,243],"account":[61],"these":[63,184],"information-deficient":[64],"regions":[65],"complex":[67],"backgrounds.":[68],"Different":[69],"from":[70,97],"pure":[72],"CNNs":[73],"based":[74],"methods,":[75,222],"we":[76,102,122,178],"argue":[77],"that":[78,214],"it":[79],"feasible":[81],"practical":[83],"translate":[85],"facial":[86,200],"images":[87],"into":[88,162],"sequences":[89,163],"visual":[91,165,185],"words":[92,186],"perform":[94],"expression":[95,201],"recognition":[96],"a":[98],"global":[99,189],"perspective.":[100],"Therefore,":[101],"propose":[103,123,179],"Visual":[105],"Transformers":[106,173],"with":[107,149,187,231,234,238],"Feature":[108],"Fusion":[109],"(VTFF)":[110],"tackle":[112],"by":[117,137,145,169],"two":[118,131],"main":[119],"steps.":[120],"First,":[121],"attentional":[125],"selective":[126],"fusion":[127],"(ASF)":[128],"leveraging":[130],"kinds":[132],"feature":[134,155],"maps":[135,156],"generated":[136],"two-branch":[138],"CNNs.":[139],"The":[140,153,191,240],"ASF":[141],"captures":[142],"discriminative":[143],"information":[144],"fusing":[146],"multiple":[147],"features":[148],"global-local":[151],"attention.":[152],"fused":[154],"are":[157],"then":[158],"flattened":[159],"projected":[161],"words.":[166],"Second,":[167],"inspired":[168],"success":[171],"natural":[175],"language":[176],"processing,":[177],"model":[181],"relationships":[182],"between":[183],"self-attention.":[190],"proposed":[192,252],"method":[193,216],"evaluated":[195],"three":[197],"public":[198],"in-the-wild":[199],"datasets":[202],"(RAF-DB,":[203],"FERPlus":[204,233],"AffectNet).":[206],"Under":[207],"same":[209],"settings,":[210],"extensive":[211],"experiments":[212],"demonstrate":[213],"our":[215],"shows":[217,245],"superior":[218],"performance":[219],"over":[220],"setting":[223],"new":[224],"state":[225],"art":[228],"RAF-DB":[230],"88.14%,":[232],"88.81%":[235],"AffectNet":[237],"61.85%.":[239],"cross-dataset":[241],"evaluation":[242],"CK+":[244],"promising":[247],"generalization":[248],"capability":[249],"method.":[253]},"counts_by_year":[{"year":2026,"cited_by_count":11},{"year":2025,"cited_by_count":96},{"year":2024,"cited_by_count":75},{"year":2023,"cited_by_count":74},{"year":2022,"cited_by_count":23},{"year":2021,"cited_by_count":1}],"updated_date":"2026-05-11T08:15:01.531666","created_date":"2025-10-10T00:00:00"}
