{"id":"https://openalex.org/W4415536168","doi":"https://doi.org/10.1145/3746027.3755538","title":"Kinematic Enhanced Hypergraph Convolutional Network for Skeleton-based Human Action Recognition with LLM Training Guides","display_name":"Kinematic Enhanced Hypergraph Convolutional Network for Skeleton-based Human Action Recognition with LLM Training Guides","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415536168","doi":"https://doi.org/10.1145/3746027.3755538"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3755538","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755538","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100613879","display_name":"Nan Ma","orcid":"https://orcid.org/0000-0001-6264-2365"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]},{"id":"https://openalex.org/I4210164898","display_name":"Beijing Chaoyang Emergency Medical Center","ror":"https://ror.org/05anb7a53","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210164898"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Nan Ma","raw_affiliation_strings":["School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China","institution_ids":["https://openalex.org/I37796252","https://openalex.org/I4210164898"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113192659","display_name":"Beining Sun","orcid":"https://orcid.org/0009-0006-7814-9368"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]},{"id":"https://openalex.org/I4210164898","display_name":"Beijing Chaoyang Emergency Medical Center","ror":"https://ror.org/05anb7a53","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210164898"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Beining Sun","raw_affiliation_strings":["School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China","institution_ids":["https://openalex.org/I37796252","https://openalex.org/I4210164898"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035402576","display_name":"Yiheng Han","orcid":"https://orcid.org/0000-0002-3986-7555"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]},{"id":"https://openalex.org/I4210164898","display_name":"Beijing Chaoyang Emergency Medical Center","ror":"https://ror.org/05anb7a53","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210164898"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yiheng Han","raw_affiliation_strings":["School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China","institution_ids":["https://openalex.org/I37796252","https://openalex.org/I4210164898"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112507939","display_name":"Genbao Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]},{"id":"https://openalex.org/I4210164898","display_name":"Beijing Chaoyang Emergency Medical Center","ror":"https://ror.org/05anb7a53","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210164898"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Genbao Xu","raw_affiliation_strings":["School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Beijing University of Technology, Chaoyang Qu, Beijing Shi, China","institution_ids":["https://openalex.org/I37796252","https://openalex.org/I4210164898"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100613879"],"corresponding_institution_ids":["https://openalex.org/I37796252","https://openalex.org/I4210164898"],"apc_list":null,"apc_paid":null,"fwci":1.1919,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.84137756,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1920","last_page":"1928"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.8700000047683716},{"id":"https://openalex.org/keywords/hypergraph","display_name":"Hypergraph","score":0.7408999800682068},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5777999758720398},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.5088000297546387},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.46389999985694885},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4636000096797943},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.3905999958515167},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3878999948501587}],"concepts":[{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.8700000047683716},{"id":"https://openalex.org/C2781221856","wikidata":"https://www.wikidata.org/wiki/Q840247","display_name":"Hypergraph","level":2,"score":0.7408999800682068},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6898999810218811},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5946999788284302},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5777999758720398},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.5088000297546387},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.46389999985694885},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4636000096797943},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.3905999958515167},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3878999948501587},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.3806000053882599},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.37209999561309814},{"id":"https://openalex.org/C62837456","wikidata":"https://www.wikidata.org/wiki/Q678308","display_name":"Kinematic chain","level":3,"score":0.3675999939441681},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.365200012922287},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.3346000015735626},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3287999927997589},{"id":"https://openalex.org/C18969341","wikidata":"https://www.wikidata.org/wiki/Q1169129","display_name":"Skeleton (computer programming)","level":2,"score":0.29600000381469727},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2946999967098236},{"id":"https://openalex.org/C194544171","wikidata":"https://www.wikidata.org/wiki/Q21105679","display_name":"Gating","level":2,"score":0.29429998993873596},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.28610000014305115},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26170000433921814},{"id":"https://openalex.org/C150303390","wikidata":"https://www.wikidata.org/wiki/Q1983852","display_name":"Virtual actor","level":3,"score":0.2590000033378601},{"id":"https://openalex.org/C104122410","wikidata":"https://www.wikidata.org/wiki/Q1416406","display_name":"Network model","level":2,"score":0.2583000063896179}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3755538","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755538","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3220979006","display_name":null,"funder_award_id":"Nos. 62371013","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2054041160","https://openalex.org/W2150884987","https://openalex.org/W2510185399","https://openalex.org/W2604321021","https://openalex.org/W2892880750","https://openalex.org/W2948058585","https://openalex.org/W2963076818","https://openalex.org/W2963465695","https://openalex.org/W2964134613","https://openalex.org/W2966438217","https://openalex.org/W3035050855","https://openalex.org/W3093411241","https://openalex.org/W3108496296","https://openalex.org/W3125955391","https://openalex.org/W3153110474","https://openalex.org/W3185273257","https://openalex.org/W3203634062","https://openalex.org/W3207613026","https://openalex.org/W4280576085","https://openalex.org/W4283377921","https://openalex.org/W4283775680","https://openalex.org/W4285085664","https://openalex.org/W4386075639","https://openalex.org/W4386172478","https://openalex.org/W4390871806","https://openalex.org/W4390871852","https://openalex.org/W4396629483","https://openalex.org/W4402716188","https://openalex.org/W4405778915"],"related_works":[],"abstract_inverted_index":{"Skeleton-based":[0],"human":[1,74],"action":[2],"recognition":[3],"has":[4],"wide":[5],"applications":[6],"in":[7],"video":[8],"understanding":[9],"and":[10,22,28,59,84,97,129,142,166],"virtual":[11],"reality.":[12],"However,":[13],"most":[14],"existing":[15],"methods":[16],"focus":[17],"excessively":[18],"on":[19,106,159],"spatial":[20],"location":[21],"global":[23,128],"movement,":[24],"while":[25],"underrepresenting":[26],"subtle":[27],"local":[29,130],"actions.":[30],"To":[31],"address":[32],"the":[33,66,77,81,85,102,107,115,155,169],"limitation,":[34],"we":[35,64,113],"innovatively":[36],"propose":[37],"a":[38,89,120,126],"Kinematic":[39,56,60],"Enhanced":[40],"Hypergraph":[41,57],"Convolutional":[42],"Network(KEHCN)":[43],"with":[44],"LLM":[45,53],"training":[46,103],"guides.":[47],"The":[48,157],"network":[49,69,117,133],"mainly":[50],"consists":[51],"of":[52,109,151],"Training":[54],"Guides(LTG),":[55],"Convolution(KHC),":[58],"Gating":[61],"Module(KGM).":[62],"Specifically,":[63],"use":[65],"hypergraph":[67],"convolutional":[68],"to":[70,79,87,94,144,173],"extract":[71],"high-order":[72],"correlated":[73],"skeleton":[75],"features,":[76],"KHC":[78],"encode":[80],"kinematic":[82,98,121,137],"features":[83,100,138],"LTG":[86,141],"provide":[88],"pre-trained":[90],"large":[91],"language":[92],"model":[93],"generate":[95],"text":[96],"description":[99],"during":[101],"phase.":[104],"Based":[105],"Mixture":[108],"Experts":[110],"(MoE)":[111],"framework,":[112],"simplify":[114],"gating":[116],"by":[118],"introducing":[119],"feature":[122],"threshold,":[123],"thereby":[124],"constructing":[125],"dual-branch":[127],"motion":[131],"expert":[132],"(KGM).":[134],"We":[135],"integrated":[136],"into":[139],"KHC,":[140],"KGM":[143],"seek":[145],"improvements":[146],"from":[147],"three":[148,160],"perspectives,":[149],"all":[150],"which":[152],"have":[153],"enhanced":[154],"performance.":[156],"experiments":[158],"benchmark":[161],"datasets(NTU":[162],"RGB+D,":[163],"NTU-RGB+D":[164],"120":[165],"NW-UCLA),":[167],"demonstrate":[168],"state-of-the-art":[170],"performance":[171],"compared":[172],"current":[174],"open-source":[175],"methods.":[176]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-25T00:00:00"}
