{"id":"https://openalex.org/W4411472251","doi":"https://doi.org/10.1109/access.2025.3581734","title":"Real-Time Human Action Recognition With Dynamical Frame Processing via Modified ConvLSTM and BERT","display_name":"Real-Time Human Action Recognition With Dynamical Frame Processing via Modified ConvLSTM and BERT","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4411472251","doi":"https://doi.org/10.1109/access.2025.3581734"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3581734","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3581734","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3581734","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013802009","display_name":"Raden Hadapiningsyah Kusumoseniarto","orcid":null},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Raden Hadapiningsyah Kusumoseniarto","raw_affiliation_strings":["Electronics and Computer Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"Electronics and Computer Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049506273","display_name":"Zhiping Lin","orcid":"https://orcid.org/0000-0002-1587-1226"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Zhi-Yuan Lin","raw_affiliation_strings":["Electrical Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035915560","display_name":"Shun\u2010Feng Su","orcid":"https://orcid.org/0000-0001-9777-128X"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shun-Feng Su","raw_affiliation_strings":["Electrical Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009788338","display_name":"Pei\u2010Jun Lee","orcid":"https://orcid.org/0000-0003-2010-0853"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Pei-Jun Lee","raw_affiliation_strings":["Electronics and Computer Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan"],"affiliations":[{"raw_affiliation_string":"Electronics and Computer Engineering Department, National Taiwan University of Science and Technology, Taipei, Taiwan","institution_ids":["https://openalex.org/I154864474"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5013802009"],"corresponding_institution_ids":["https://openalex.org/I154864474"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12282886,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"112368","last_page":"112377"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9595999717712402,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9218000173568726,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7647979259490967},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.6378573179244995},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5911210775375366},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5775421261787415},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5626203417778015},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4532018303871155},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3487592935562134},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.11631852388381958},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0819949209690094}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7647979259490967},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.6378573179244995},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5911210775375366},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5775421261787415},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5626203417778015},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4532018303871155},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3487592935562134},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.11631852388381958},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0819949209690094},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3581734","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3581734","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:8ee5a5d08e204767bea68391601eb2fd","is_oa":true,"landing_page_url":"https://doaj.org/article/8ee5a5d08e204767bea68391601eb2fd","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 112368-112377 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3581734","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3581734","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1945123189","https://openalex.org/W2194775991","https://openalex.org/W2293634267","https://openalex.org/W2307770531","https://openalex.org/W2325939864","https://openalex.org/W2462996230","https://openalex.org/W2559085405","https://openalex.org/W2618530766","https://openalex.org/W2618799552","https://openalex.org/W2769039400","https://openalex.org/W2868292291","https://openalex.org/W2896457183","https://openalex.org/W2916798096","https://openalex.org/W2944006115","https://openalex.org/W2963155035","https://openalex.org/W2963524571","https://openalex.org/W2963616706","https://openalex.org/W2963775820","https://openalex.org/W2963795951","https://openalex.org/W2964134613","https://openalex.org/W2990503944","https://openalex.org/W3020836386","https://openalex.org/W3034572008","https://openalex.org/W3128636476","https://openalex.org/W4312245820","https://openalex.org/W4324135644","https://openalex.org/W4385245566","https://openalex.org/W4394595489","https://openalex.org/W6628877408"],"related_works":["https://openalex.org/W2084487854","https://openalex.org/W2389546251","https://openalex.org/W2353878298","https://openalex.org/W2369556382","https://openalex.org/W4205118967","https://openalex.org/W2077682749","https://openalex.org/W2298450300","https://openalex.org/W2545205567","https://openalex.org/W1576128429","https://openalex.org/W2269464716"],"abstract_inverted_index":{"In":[0,63],"this":[1],"study,":[2],"a":[3,22,29,50,88,96,138,207],"human":[4,46],"action":[5,19,47,213,218],"recognition":[6,20,48,214],"approach":[7],"with":[8,28,36,73,136],"dynamical":[9,185],"frame":[10,52,186],"processing":[11,86],"is":[12,42,180],"proposed":[13,43,65],"to":[14,44,80,115,183],"fulfill":[15],"the":[16,82,104,121,190],"need":[17],"for":[18,159,224],"in":[21,87,144,203],"real-time":[23,149,201],"manner.":[24],"A":[25,174],"novel":[26],"architecture":[27],"modified":[30],"convolutional":[31,90],"long":[32],"short-term":[33],"memory":[34],"(ModConvLSTM)":[35],"pose":[37],"heatmaps":[38],"as":[39,157],"input":[40],"features":[41],"achieve":[45,116],"without":[49,215,231],"fixed":[51],"number.":[53],"The":[54],"effects":[55],"of":[56,84,118,131,141,177],"ModConvLSTM":[57,191],"are":[58],"verified":[59],"at":[60],"different":[61],"depths.":[62],"our":[64,113,162,178,221],"architecture,":[66],"we":[67],"replace":[68],"global":[69],"average":[70],"pooling":[71],"(GAP)":[72],"Bidirectional":[74],"Encoder":[75],"Representations":[76],"from":[77],"Transformers":[78],"(BERT)":[79],"address":[81],"limitations":[83],"temporal":[85],"two-dimensional":[89],"neural":[91],"network":[92,114],"(2D-CNN).":[93],"By":[94],"incorporating":[95],"training-stage":[97],"mask":[98],"and":[99,124,133,193],"leveraging":[100],"BERT\u2019s":[101],"attention":[102],"mechanism,":[103],"model":[105,163,222],"gains":[106],"improved":[107],"contextual":[108],"understanding.":[109],"This":[110,209],"enhancement":[111],"enables":[112,211],"accuracies":[117],"91.46%":[119],"on":[120,126,153,171,206],"NTU60":[122],"dataset":[123],"83.06%":[125],"NTU120,":[127],"marking":[128],"an":[129],"improvement":[130],"1.63%":[132],"3.22%,":[134],"respectively,":[135],"only":[137],"slight":[139],"increase":[140],"0.1":[142],"GFLOPs":[143],"computational":[145],"cost.":[146],"Unlike":[147],"other":[148],"models":[150],"that":[151],"rely":[152],"large-scale":[154],"datasets":[155],"such":[156],"Kinetics":[158],"extensive":[160],"pretraining,":[161],"achieves":[164],"competitive":[165],"performance":[166],"while":[167],"being":[168],"trained":[169],"directly":[170],"NTU":[172],"datasets.":[173],"key":[175],"contribution":[176],"work":[179],"its":[181],"ability":[182],"perform":[184],"recognition,":[187],"efficiently":[188],"updating":[189],"cell":[192],"computing":[194],"BERT":[195],"every":[196],"four":[197],"new":[198],"frames,":[199],"achieving":[200],"inference":[202],"just":[204],"14.2ms":[205],"CPU.":[208],"study":[210],"continuous":[212],"requiring":[216],"predefined":[217],"boundaries,":[219],"making":[220],"well-suited":[223],"real-world":[225],"applications":[226],"where":[227],"actions":[228],"occur":[229],"naturally":[230],"explicit":[232],"segmentation.":[233]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
