{"id":"https://openalex.org/W4387969083","doi":"https://doi.org/10.1145/3581783.3612852","title":"Sliding Window Seq2seq Modeling for Engagement Estimation","display_name":"Sliding Window Seq2seq Modeling for Engagement Estimation","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4387969083","doi":"https://doi.org/10.1145/3581783.3612852"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3612852","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612852","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048818071","display_name":"Jun Yu","orcid":"https://orcid.org/0000-0002-3197-8103"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Yu","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-3197-8103","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045007834","display_name":"Keda Lu","orcid":"https://orcid.org/0009-0006-8974-3813"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Keda Lu","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0009-0006-8974-3813","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077962053","display_name":"Mohan Jing","orcid":"https://orcid.org/0009-0003-3891-9207"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mohan Jing","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0009-0003-3891-9207","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057417516","display_name":"Ziqi Liang","orcid":"https://orcid.org/0009-0006-8488-991X"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziqi Liang","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0009-0006-8488-991X","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101459239","display_name":"Bingyuan Zhang","orcid":"https://orcid.org/0009-0003-6000-6631"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingyuan Zhang","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0009-0003-6000-6631","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047888605","display_name":"Jianqing Sun","orcid":"https://orcid.org/0009-0007-3598-8564"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jianqing Sun","raw_affiliation_strings":["Unisound AI Technology Co.,Ltd, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0007-3598-8564","affiliations":[{"raw_affiliation_string":"Unisound AI Technology Co.,Ltd, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039730743","display_name":"Jiaen Liang","orcid":"https://orcid.org/0009-0001-8309-1301"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiaen Liang","raw_affiliation_strings":["Unisound AI Technology Co.,Ltd, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0001-8309-1301","affiliations":[{"raw_affiliation_string":"Unisound AI Technology Co.,Ltd, Beijing, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.7859,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.74592503,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"9496","last_page":"9500"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7169826626777649},{"id":"https://openalex.org/keywords/sliding-window-protocol","display_name":"Sliding window protocol","score":0.7156879901885986},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.5278682112693787},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5194603800773621},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.45043396949768066},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4484427869319916},{"id":"https://openalex.org/keywords/window","display_name":"Window (computing)","score":0.44633162021636963},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.44353193044662476},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4378507435321808},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4281269311904907},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3258037269115448},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11008888483047485},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.08146658539772034},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07687419652938843}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7169826626777649},{"id":"https://openalex.org/C102392041","wikidata":"https://www.wikidata.org/wiki/Q592860","display_name":"Sliding window protocol","level":3,"score":0.7156879901885986},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.5278682112693787},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5194603800773621},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.45043396949768066},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4484427869319916},{"id":"https://openalex.org/C2778751112","wikidata":"https://www.wikidata.org/wiki/Q835016","display_name":"Window (computing)","level":2,"score":0.44633162021636963},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.44353193044662476},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4378507435321808},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4281269311904907},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3258037269115448},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11008888483047485},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.08146658539772034},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07687419652938843},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581783.3612852","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612852","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G450612882","display_name":null,"funder_award_id":"62276242","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320325599","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2015752089","https://openalex.org/W2042587338","https://openalex.org/W2064675550","https://openalex.org/W2105410877","https://openalex.org/W2131774270","https://openalex.org/W2139916508","https://openalex.org/W2194775991","https://openalex.org/W2239141610","https://openalex.org/W2313339984","https://openalex.org/W2559085405","https://openalex.org/W2755291975","https://openalex.org/W2807126412","https://openalex.org/W2895475421","https://openalex.org/W2995682556","https://openalex.org/W3184185352","https://openalex.org/W4385965696"],"related_works":["https://openalex.org/W2109115373","https://openalex.org/W2390901981","https://openalex.org/W2353818951","https://openalex.org/W1605879311","https://openalex.org/W2611980620","https://openalex.org/W4230691760","https://openalex.org/W2385763735","https://openalex.org/W4391923333","https://openalex.org/W3014558862","https://openalex.org/W150851721"],"abstract_inverted_index":{"Engagement":[0],"estimation":[1,51,108],"in":[2,82],"human":[3],"conversations":[4],"has":[5],"been":[6],"one":[7],"of":[8,29,49,91,104],"the":[9,26,41,46,75,83,89,92,100,110],"most":[10],"important":[11],"research":[12],"issues":[13],"for":[14,106],"natural":[15],"human-robot":[16],"interaction.":[17],"However,":[18],"previous":[19],"datasets":[20],"and":[21,64,77,86],"studies":[22],"mainly":[23],"focus":[24],"on":[25,109],"video-wise":[27],"level":[28,48],"engagement":[30,50,90,107],"estimation,":[31],"therefore,":[32],"can":[33],"hardly":[34],"reflect":[35],"human's":[36],"constantly":[37],"changing":[38],"engagement.":[39],"Fortunately,":[40],"MultiMediate":[42],"'23":[43],"challenge":[44],"provides":[45],"frame-wise":[47],"task.":[52],"In":[53],"this":[54],"paper,":[55],"we":[56],"propose":[57],"Sliding":[58],"Window":[59],"Seq2seq":[60],"Modeling":[61],"by":[62],"BiLSTM":[63],"Transformer":[65],"with":[66],"powerful":[67],"sequence":[68],"modeling":[69],"capabilities.":[70],"Our":[71,97],"method":[72,98],"fully":[73],"utilizes":[74],"global":[76],"local":[78],"multi-modal":[79],"feature":[80],"information":[81],"participants'":[84],"videos":[85],"accurately":[87],"expresses":[88],"participants":[93],"at":[94],"each":[95],"moment.":[96],"achieves":[99],"state-of-the-art":[101],"CCC":[102],"result":[103],"0.71":[105],"corresponding":[111],"test":[112],"sets.":[113]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
