{"id":"https://openalex.org/W4376852201","doi":"https://doi.org/10.1145/3573942.3574080","title":"Patch Attention Network for Video Facial Expression Recognition","display_name":"Patch Attention Network for Video Facial Expression Recognition","publication_year":2022,"publication_date":"2022-09-23","ids":{"openalex":"https://openalex.org/W4376852201","doi":"https://doi.org/10.1145/3573942.3574080"},"language":"en","primary_location":{"id":"doi:10.1145/3573942.3574080","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3573942.3574080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 5th International Conference on Artificial Intelligence and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101705736","display_name":"Yingkai Hua","orcid":"https://orcid.org/0000-0002-9552-8873"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yingkai Hua","raw_affiliation_strings":["Zhejiang University, China"],"raw_orcid":"https://orcid.org/0000-0002-9552-8873","affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101494891","display_name":"Xinmin Xu","orcid":"https://orcid.org/0000-0002-0910-2375"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinmin Xu","raw_affiliation_strings":["Zhejiang University, China"],"raw_orcid":"https://orcid.org/0000-0002-0910-2375","affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101705736"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.2287464,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"689","last_page":"694"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/facial-expression-recognition","display_name":"Facial expression recognition","score":0.7761760950088501},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7735252380371094},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6893337965011597},{"id":"https://openalex.org/keywords/facial-expression","display_name":"Facial expression","score":0.6495922803878784},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.5663415193557739},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5343412756919861},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.503987729549408},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4825103282928467},{"id":"https://openalex.org/keywords/facial-recognition-system","display_name":"Facial recognition system","score":0.42802608013153076},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42407283186912537},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.16582316160202026}],"concepts":[{"id":"https://openalex.org/C2987714656","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Facial expression recognition","level":4,"score":0.7761760950088501},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7735252380371094},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6893337965011597},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.6495922803878784},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.5663415193557739},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5343412756919861},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.503987729549408},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4825103282928467},{"id":"https://openalex.org/C31510193","wikidata":"https://www.wikidata.org/wiki/Q1192553","display_name":"Facial recognition system","level":3,"score":0.42802608013153076},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42407283186912537},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.16582316160202026},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3573942.3574080","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3573942.3574080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 5th International Conference on Artificial Intelligence and Pattern Recognition","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1522734439","https://openalex.org/W2217426128","https://openalex.org/W2479639417","https://openalex.org/W2744078350","https://openalex.org/W2798583514","https://openalex.org/W2799041689","https://openalex.org/W2904483377","https://openalex.org/W2938613434","https://openalex.org/W2970710980","https://openalex.org/W3003720578","https://openalex.org/W3034751874","https://openalex.org/W3035336958","https://openalex.org/W3046911849","https://openalex.org/W4214645187"],"related_works":["https://openalex.org/W2642127892","https://openalex.org/W4205986151","https://openalex.org/W2355913164","https://openalex.org/W1153638794","https://openalex.org/W2168968280","https://openalex.org/W2116055069","https://openalex.org/W2162992774","https://openalex.org/W4323520705","https://openalex.org/W2356663679","https://openalex.org/W2169777806"],"abstract_inverted_index":{"Facial":[0],"expression":[1,23,86],"recognition":[2,24],"(FER)":[3],"is":[4],"a":[5,47],"hot":[6],"research":[7],"topic":[8],"in":[9,21],"computer":[10],"vision.":[11],"In":[12,42],"recent":[13],"years,":[14],"attention":[15,34,54],"mechanism":[16,35,55],"has":[17],"been":[18],"widely":[19],"used":[20],"facial":[22],"tasks":[25],"and":[26,74,93],"achieved":[27],"good":[28],"results.":[29],"However,":[30],"most":[31],"methods":[32],"applying":[33],"are":[36],"aimed":[37],"at":[38],"static":[39],"image-based":[40],"FER.":[41,58],"this":[43],"paper,":[44],"we":[45],"propose":[46],"novel":[48],"convolution":[49],"neutral":[50],"network":[51,60],"(CNN)":[52],"with":[53,71],"for":[56],"video-based":[57],"Our":[59],"introduces":[61],"Patch":[62,75],"Diff":[63],"Attention":[64,77],"(PDA)":[65],"module":[66,79],"to":[67,80,105],"focus":[68,81],"on":[69,82,91],"regions":[70,83],"large":[72],"variation,":[73],"Self":[76],"(PSA)":[78],"containing":[84],"more":[85],"information.":[87],"With":[88],"extensive":[89],"experiments":[90],"CK+":[92],"AFEW":[94],"datasets,":[95],"our":[96],"proposed":[97],"method":[98],"shows":[99],"superior":[100],"or":[101],"similar":[102],"performance":[103],"compared":[104],"the":[106],"state-of-the-art":[107],"approaches.":[108]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
