{"id":"https://openalex.org/W4415539290","doi":"https://doi.org/10.1145/3746027.3755404","title":"EventLip: Enhancing Event-Based Lip Reading via Frequency-Aware Spatiotemporal Hypergraph Modeling","display_name":"EventLip: Enhancing Event-Based Lip Reading via Frequency-Aware Spatiotemporal Hypergraph Modeling","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415539290","doi":"https://doi.org/10.1145/3746027.3755404"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3755404","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755404","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103064052","display_name":"Xueyi Zhang","orcid":"https://orcid.org/0009-0008-2394-3518"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xueyi Zhang","raw_affiliation_strings":["National University of Defense Technology, changsha, China"],"raw_orcid":"https://orcid.org/0009-0008-2394-3518","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031239761","display_name":"Jialu Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jialu Sun","raw_affiliation_strings":["The Chinese University of Hong Kong, Shenzhen, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0009-0218-7829","affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102710394","display_name":"Chengwei Zhang","orcid":"https://orcid.org/0000-0002-3375-2458"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengwei Zhang","raw_affiliation_strings":["University of the Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3375-2458","affiliations":[{"raw_affiliation_string":"University of the Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060201191","display_name":"Xianghu Yue","orcid":"https://orcid.org/0000-0003-3527-6034"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xianghu Yue","raw_affiliation_strings":["Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0003-3527-6034","affiliations":[{"raw_affiliation_string":"Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082822511","display_name":"T. Xiao","orcid":"https://orcid.org/0000-0002-3303-1036"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianfang Xiao","raw_affiliation_strings":["Sun Yat-sen University, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-3303-1036","affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028082407","display_name":"Shengliang Cai","orcid":null},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siqi Cai","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0007-4386-0472","affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028043255","display_name":"Mingrui Lao","orcid":"https://orcid.org/0000-0001-8413-7220"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingrui Lao","raw_affiliation_strings":["National University of Defense Technology, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0001-8413-7220","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":null},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":["The Chinese University of Hong Kong, Shenzhen, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-9158-9401","affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I4210116924"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5103064052"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28821239,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"8263","last_page":"8272"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hypergraph","display_name":"Hypergraph","score":0.8125},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7688000202178955},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.5932000279426575},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5593000054359436},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43799999356269836},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.412200003862381},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.40459999442100525},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.3815999925136566}],"concepts":[{"id":"https://openalex.org/C2781221856","wikidata":"https://www.wikidata.org/wiki/Q840247","display_name":"Hypergraph","level":2,"score":0.8125},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7688000202178955},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6771000027656555},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.5932000279426575},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5647000074386597},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5593000054359436},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43799999356269836},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.412200003862381},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.40459999442100525},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.3815999925136566},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C2777810175","wikidata":"https://www.wikidata.org/wiki/Q5416730","display_name":"Event structure","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.27149999141693115},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2685000002384186},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2646999955177307},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3755404","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755404","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W2073044325","https://openalex.org/W2132680170","https://openalex.org/W2157262520","https://openalex.org/W2806331055","https://openalex.org/W2907888938","https://openalex.org/W2922107638","https://openalex.org/W2951333473","https://openalex.org/W2963524571","https://openalex.org/W2969508737","https://openalex.org/W2979450518","https://openalex.org/W3010268791","https://openalex.org/W3046688540","https://openalex.org/W3133758660","https://openalex.org/W3156853927","https://openalex.org/W3168565360","https://openalex.org/W3177222833","https://openalex.org/W3188692592","https://openalex.org/W4200337780","https://openalex.org/W4200635484","https://openalex.org/W4214727094","https://openalex.org/W4224983022","https://openalex.org/W4282926996","https://openalex.org/W4282968465","https://openalex.org/W4288770705","https://openalex.org/W4315650277","https://openalex.org/W4377990899","https://openalex.org/W4378472859","https://openalex.org/W4378805097","https://openalex.org/W4386172478","https://openalex.org/W4386432206","https://openalex.org/W4387491256","https://openalex.org/W4387969641","https://openalex.org/W4391512994","https://openalex.org/W4396629483","https://openalex.org/W4396732977","https://openalex.org/W4398254293","https://openalex.org/W4399541983","https://openalex.org/W4409365952","https://openalex.org/W4412377338"],"related_works":[],"abstract_inverted_index":{"Event":[0],"cameras,":[1],"with":[2],"their":[3],"microsecond-level":[4],"temporal":[5],"resolution":[6],"and":[7,28,53,96,113,173,183,189,197],"sparse":[8],"visual":[9,169],"encoding,":[10],"provide":[11],"a":[12,30,71,108,114,154,160,199],"transformative":[13],"paradigm":[14],"for":[15,61,78,92,202],"automatic":[16],"lip":[17,41,63,80,126,138,149,204],"reading":[18],"(ALR).":[19],"However,":[20],"event":[21],"data":[22],"inherently":[23],"lack":[24],"explicit":[25],"spatial":[26],"structure":[27],"exhibit":[29],"pronounced":[31],"frequency-domain":[32],"bias.":[33],"The":[34,119],"low-frequency":[35,85],"components":[36],"fail":[37],"to":[38,87,101,144,167],"capture":[39,145],"crucial":[40],"structural":[42,134],"information,":[43],"which":[44,58],"fundamentally":[45],"impedes":[46],"the":[47,89,129,137,142,175,187],"modeling":[48],"of":[49,57,177],"intra-frame":[50,122],"topological":[51,123],"dependencies":[52,124],"inter-frame":[54,133],"semantic":[55],"evolution-both":[56],"are":[59],"critical":[60],"robust":[62],"reading.":[64,81,205],"To":[65],"this":[66],"end,":[67],"we":[68,83,106,152],"propose":[69,153],"FAST-HG,":[70],"Frequency-Aware":[72],"SpatioTemporal":[73],"HyperGraph":[74],"framework":[75],"specifically":[76],"designed":[77,166],"event-based":[79,203],"First,":[82],"apply":[84],"perturbation":[86],"improve":[88],"model's":[90],"robustness":[91],"capturing":[93],"discriminative":[94,146],"features,":[95],"integrate":[97],"adaptive":[98],"high-frequency":[99],"filtering":[100],"enhance":[102],"edge-aware":[103],"representations.":[104],"Then,":[105],"construct":[107],"Spatial":[109],"Region":[110],"Hypergraph":[111,117],"(SRH)":[112],"Temporal":[115],"Semantic":[116],"(TSH).":[118],"former":[120],"captures":[121],"among":[125],"regions,":[127],"while":[128],"latter":[130],"explicitly":[131],"models":[132],"associations":[135],"throughout":[136],"movement":[139],"process,":[140],"enabling":[141],"model":[143],"patterns":[147],"in":[148],"dynamics.":[150],"Furthermore,":[151],"viseme-aware":[155],"label":[156],"smoothing":[157],"strategy,":[158],"where":[159],"novel":[161],"viseme-level":[162],"edit":[163],"distance":[164],"is":[165],"quantify":[168],"similarities":[170],"between":[171],"classes":[172],"guide":[174],"construction":[176],"soft":[178],"labels.":[179],"FAST-HG":[180],"achieves":[181],"79.85%":[182],"84.03%":[184],"accuracy":[185],"on":[186],"DVS-Lip":[188],"DVS-LRW100":[190],"datasets,":[191],"respectively,":[192],"significantly":[193],"outperforming":[194],"prior":[195],"methods":[196],"establishing":[198],"new":[200],"benchmark":[201]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-25T00:00:00"}
