{"id":"https://openalex.org/W7147686699","doi":"https://doi.org/10.1109/cnml68938.2026.11452298","title":"Efficient Multimodal Fusion of Skeleton and Posture Cues for Robust Behavior Understanding","display_name":"Efficient Multimodal Fusion of Skeleton and Posture Cues for Robust Behavior Understanding","publication_year":2026,"publication_date":"2026-01-30","ids":{"openalex":"https://openalex.org/W7147686699","doi":"https://doi.org/10.1109/cnml68938.2026.11452298"},"language":null,"primary_location":{"id":"doi:10.1109/cnml68938.2026.11452298","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cnml68938.2026.11452298","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on Communication Networks and Machine Learning (CNML)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003319392","display_name":"Yujian Zhang","orcid":"https://orcid.org/0000-0001-7450-2642"},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yujian Zhang","raw_affiliation_strings":["Jinan University&#x2013;University of Birmingham Joint Institute Jinan University,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Jinan University&#x2013;University of Birmingham Joint Institute Jinan University,Guangzhou,China","institution_ids":["https://openalex.org/I159948400"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123769129","display_name":"Xiaoli Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I159948400","display_name":"Jinan University","ror":"https://ror.org/02xe5ns62","country_code":"CN","type":"education","lineage":["https://openalex.org/I159948400"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoli Liu","raw_affiliation_strings":["Jinan University&#x2013;University of Birmingham Joint Institute Jinan University,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Jinan University&#x2013;University of Birmingham Joint Institute Jinan University,Guangzhou,China","institution_ids":["https://openalex.org/I159948400"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100338400","display_name":"Jingjing Li","orcid":"https://orcid.org/0000-0003-0811-4988"},"institutions":[{"id":"https://openalex.org/I5343935","display_name":"Guilin University of Electronic Technology","ror":"https://ror.org/05arjae42","country_code":"CN","type":"education","lineage":["https://openalex.org/I5343935"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing Li","raw_affiliation_strings":["Guilin University of Electronic Technology,Guangxi Key Laboratory of Trusted Software,Guilin,China,541004"],"affiliations":[{"raw_affiliation_string":"Guilin University of Electronic Technology,Guangxi Key Laboratory of Trusted Software,Guilin,China,541004","institution_ids":["https://openalex.org/I5343935"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034029145","display_name":"Qingzhen Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I187400657","display_name":"South China Normal University","ror":"https://ror.org/01kq0pv72","country_code":"CN","type":"education","lineage":["https://openalex.org/I187400657"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingzhen Xu","raw_affiliation_strings":["South China Normal University,School of Computer Science,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"South China Normal University,School of Computer Science,Guangzhou,China","institution_ids":["https://openalex.org/I187400657"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5003319392"],"corresponding_institution_ids":["https://openalex.org/I159948400"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.9267205,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"795","last_page":"802"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9065999984741211,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9065999984741211,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.04010000079870224,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10444","display_name":"Context-Aware Activity Recognition Systems","score":0.009399999864399433,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.6617000102996826},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6183000206947327},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5378000140190125},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.49459999799728394},{"id":"https://openalex.org/keywords/activity-recognition","display_name":"Activity recognition","score":0.43790000677108765},{"id":"https://openalex.org/keywords/virtual-reality","display_name":"Virtual reality","score":0.4016999900341034},{"id":"https://openalex.org/keywords/skeleton","display_name":"Skeleton (computer programming)","score":0.38909998536109924},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.3815999925136566}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.815500020980835},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.6617000102996826},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.654699981212616},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6183000206947327},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5378000140190125},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.49459999799728394},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44190001487731934},{"id":"https://openalex.org/C121687571","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Activity recognition","level":2,"score":0.43790000677108765},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.4016999900341034},{"id":"https://openalex.org/C18969341","wikidata":"https://www.wikidata.org/wiki/Q1169129","display_name":"Skeleton (computer programming)","level":2,"score":0.38909998536109924},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3828999996185303},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3815999925136566},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37450000643730164},{"id":"https://openalex.org/C150303390","wikidata":"https://www.wikidata.org/wiki/Q1983852","display_name":"Virtual actor","level":3,"score":0.37389999628067017},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3582000136375427},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.33809998631477356},{"id":"https://openalex.org/C2777846634","wikidata":"https://www.wikidata.org/wiki/Q9621","display_name":"Human skeleton","level":2,"score":0.3361999988555908},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.32199999690055847},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3183000087738037},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.30239999294281006},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2669999897480011},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cnml68938.2026.11452298","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cnml68938.2026.11452298","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on Communication Networks and Machine Learning (CNML)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2044774029","https://openalex.org/W2739179646","https://openalex.org/W2810685774","https://openalex.org/W2941718503","https://openalex.org/W2948058585","https://openalex.org/W2963037989","https://openalex.org/W2963076818","https://openalex.org/W2982083293","https://openalex.org/W3130191949","https://openalex.org/W4206459143","https://openalex.org/W4220733951","https://openalex.org/W4312245820","https://openalex.org/W4367301504","https://openalex.org/W4404722309","https://openalex.org/W4407361273","https://openalex.org/W4409129251"],"related_works":[],"abstract_inverted_index":{"Accurate":[0],"and":[1,15,26,39,59,85,100,111,132,143],"robust":[2],"human":[3,74],"behavior":[4],"recognition":[5,109],"has":[6],"become":[7],"a":[8,44,53,89],"key":[9],"requirement":[10],"in":[11,129,145],"Extended":[12],"Reality":[13],"(XR)":[14],"human\u2013computer":[16],"interaction":[17,141],"scenarios":[18],"such":[19],"as":[20,88],"immersive":[21],"learning,":[22],"collaborative":[23],"virtual":[24],"spaces,":[25],"healthcare":[27],"monitoring.":[28],"Yet,":[29],"building":[30],"models":[31],"that":[32,56,123],"can":[33],"operate":[34],"reliably":[35],"under":[36],"limited":[37],"resources":[38],"dynamically":[40],"changing":[41],"conditions":[42],"remains":[43],"pressing":[45],"issue.":[46],"To":[47],"tackle":[48],"this,":[49],"we":[50],"introduce":[51],"YOLO-OpenPoseNet,":[52],"multimodal":[54],"framework":[55],"fuses":[57],"object-level":[58],"pose-level":[60],"information":[61],"for":[62,72,92,138],"efficient":[63],"action":[64],"recognition.":[65],"In":[66],"our":[67],"design,":[68],"YOLOv5":[69],"is":[70],"used":[71],"fast":[73],"detection,":[75],"OpenPose":[76],"provides":[77],"fine-grained":[78],"skeletal":[79],"keypoints":[80],"to":[81],"describe":[82],"posture":[83],"variations,":[84],"MobileNetV3":[86],"functions":[87],"lightweight":[90],"backbone":[91],"classification.":[93],"By":[94],"jointly":[95],"leveraging":[96],"bounding-box":[97],"visual":[98],"cues":[99],"skeleton-based":[101],"spatial":[102],"representations,":[103],"the":[104,116],"model":[105],"achieves":[106],"both":[107],"high":[108],"accuracy":[110],"computational":[112],"efficiency.":[113],"Experiments":[114],"on":[115],"UCI":[117],"Multiview":[118],"Human":[119],"Action":[120],"Database":[121],"confirm":[122],"YOLO-OpenPoseNet":[124],"outperforms":[125],"representative":[126],"unimodal":[127],"approaches":[128],"precision,":[130],"recall,":[131],"F1":[133],"score,":[134],"demonstrating":[135],"its":[136],"suitability":[137],"real-time":[139],"XR-enhanced":[140],"systems":[142],"deployment":[144],"resource-constrained":[146],"IoT":[147],"environments.":[148]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
