{"id":"https://openalex.org/W4415968498","doi":"https://doi.org/10.1109/iecon58223.2025.11221050","title":"Transformer-based Human Action Recognition for Fine-Grained Industrial Assembly Tasks","display_name":"Transformer-based Human Action Recognition for Fine-Grained Industrial Assembly Tasks","publication_year":2025,"publication_date":"2025-10-14","ids":{"openalex":"https://openalex.org/W4415968498","doi":"https://doi.org/10.1109/iecon58223.2025.11221050"},"language":"en","primary_location":{"id":"doi:10.1109/iecon58223.2025.11221050","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iecon58223.2025.11221050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IECON 2025 \u2013 51st Annual Conference of the IEEE Industrial Electronics Society","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107831404","display_name":"M. Gallon","orcid":null},"institutions":[{"id":"https://openalex.org/I168974976","display_name":"Universidad de La Rioja","ror":"https://ror.org/0553yr311","country_code":"ES","type":"education","lineage":["https://openalex.org/I168974976"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Mayra Vanessa Alvear Gall\u00f3n","raw_affiliation_strings":["Universidad de La Rioja,Departamento de Matem&#x00E1;ticas y Computaci&#x00F3;n,Logro&#x00F1;o,Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidad de La Rioja,Departamento de Matem&#x00E1;ticas y Computaci&#x00F3;n,Logro&#x00F1;o,Spain","institution_ids":["https://openalex.org/I168974976"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050368761","display_name":"Cosimo Patruno","orcid":"https://orcid.org/0000-0001-8624-5444"},"institutions":[{"id":"https://openalex.org/I4210146308","display_name":"Institute of Intelligent Systems for Automation","ror":"https://ror.org/051t1q308","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Cosimo Patruno","raw_affiliation_strings":["Institute of Intelligent Industrial Technologies and Systems for Advanced Manufacturing National Research Council of Italy,Bari,Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Industrial Technologies and Systems for Advanced Manufacturing National Research Council of Italy,Bari,Italy","institution_ids":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036169141","display_name":"Gadea Mata","orcid":"https://orcid.org/0000-0002-5567-8463"},"institutions":[{"id":"https://openalex.org/I168974976","display_name":"Universidad de La Rioja","ror":"https://ror.org/0553yr311","country_code":"ES","type":"education","lineage":["https://openalex.org/I168974976"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Gadea Mata","raw_affiliation_strings":["Universidad de La Rioja,Departamento de Matem&#x00E1;ticas y Computaci&#x00F3;n,Logro&#x00F1;o,Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidad de La Rioja,Departamento de Matem&#x00E1;ticas y Computaci&#x00F3;n,Logro&#x00F1;o,Spain","institution_ids":["https://openalex.org/I168974976"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100602979","display_name":"C\u00e9sar Dom\u00ednguez","orcid":"https://orcid.org/0000-0002-2081-7523"},"institutions":[{"id":"https://openalex.org/I168974976","display_name":"Universidad de La Rioja","ror":"https://ror.org/0553yr311","country_code":"ES","type":"education","lineage":["https://openalex.org/I168974976"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"C\u00e9sar Dom\u00ednguez","raw_affiliation_strings":["Universidad de La Rioja,Departamento de Matem&#x00E1;ticas y Computaci&#x00F3;n,Logro&#x00F1;o,Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidad de La Rioja,Departamento de Matem&#x00E1;ticas y Computaci&#x00F3;n,Logro&#x00F1;o,Spain","institution_ids":["https://openalex.org/I168974976"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047403740","display_name":"Grazia Cicirelli","orcid":"https://orcid.org/0000-0003-1562-0467"},"institutions":[{"id":"https://openalex.org/I4210146308","display_name":"Institute of Intelligent Systems for Automation","ror":"https://ror.org/051t1q308","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Grazia Cicirelli","raw_affiliation_strings":["Institute of Intelligent Industrial Technologies and Systems for Advanced Manufacturing National Research Council of Italy,Bari,Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Industrial Technologies and Systems for Advanced Manufacturing National Research Council of Italy,Bari,Italy","institution_ids":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28470021,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9424999952316284,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9424999952316284,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.01679999940097332,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.00559999980032444,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.6046000123023987},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5016000270843506},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.46799999475479126},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.42719998955726624},{"id":"https://openalex.org/keywords/human-motion","display_name":"Human motion","score":0.4034999907016754},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.38449999690055847},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.3671000003814697}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7125999927520752},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.661300003528595},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.6046000123023987},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5016000270843506},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.46799999475479126},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4431999921798706},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.42719998955726624},{"id":"https://openalex.org/C2986578859","wikidata":"https://www.wikidata.org/wiki/Q657632","display_name":"Human motion","level":3,"score":0.4034999907016754},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.38449999690055847},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.3671000003814697},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3506999909877777},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.3330000042915344},{"id":"https://openalex.org/C121687571","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Activity recognition","level":2,"score":0.31839999556541443},{"id":"https://openalex.org/C2779641649","wikidata":"https://www.wikidata.org/wiki/Q18377767","display_name":"Human Dimension","level":3,"score":0.2994999885559082},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.29910001158714294},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2808000147342682},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2678000032901764},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.25690001249313354}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iecon58223.2025.11221050","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iecon58223.2025.11221050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IECON 2025 \u2013 51st Annual Conference of the IEEE Industrial Electronics Society","raw_type":"proceedings-article"},{"id":"pmh:oai:portal.dialnet.es:doc/694706a9221f004fbfa3c0f2","is_oa":false,"landing_page_url":"https://investigacion.unirioja.es/documentos/694706a9221f004fbfa3c0f2","pdf_url":null,"source":{"id":"https://openalex.org/S4306402551","display_name":"RIUR (Universidad de La Rioja)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I3032752892","host_organization_name":"Universidad Internacional de La Rioja","host_organization_lineage":["https://openalex.org/I3032752892"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/acceptedVersion"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W3024903125","https://openalex.org/W3113067059","https://openalex.org/W3138674438","https://openalex.org/W3185988714","https://openalex.org/W4200301490","https://openalex.org/W4306955484","https://openalex.org/W4311121622","https://openalex.org/W4361247902","https://openalex.org/W4385245566","https://openalex.org/W4385488815","https://openalex.org/W4401122654","https://openalex.org/W4401946706","https://openalex.org/W4403635079","https://openalex.org/W4408063250","https://openalex.org/W4410719252","https://openalex.org/W4412938019"],"related_works":[],"abstract_inverted_index":{"Human":[0],"Action":[1],"Recognition":[2],"(HAR)":[3],"in":[4,17,33,130],"industrial":[5,131],"assembly":[6,34],"scenarios":[7],"presents":[8],"significant":[9],"challenges,":[10],"primarily":[11],"due":[12],"to":[13,40,70],"the":[14,28,48,67,79,107,122,134],"slight":[15],"differences":[16],"motion":[18],"patterns":[19],"across":[20],"fine-grained":[21,127],"actions.":[22,149],"In":[23],"this":[24],"work,":[25],"we":[26,55,89],"address":[27],"problem":[29],"of":[30,124,136],"action":[31,87,128],"recognition":[32,75,114,129],"tasks":[35],"by":[36,65,116],"employing":[37],"skeleton":[38],"data":[39],"represent":[41],"detailed":[42],"human":[43,148],"movements.":[44],"To":[45],"effectively":[46],"capture":[47],"spatial":[49],"and":[50,82,140],"temporal":[51],"dependencies":[52],"among":[53],"joints,":[54],"apply":[56],"a":[57,91],"Transformer-based":[58],"architecture.":[59],"We":[60],"conducted":[61],"an":[62],"extensive":[63],"evaluation":[64],"varying":[66],"model":[68],"dimension":[69],"analyze":[71],"its":[72],"effect":[73],"on":[74],"performance.":[76],"Furthermore,":[77],"given":[78],"high":[80],"semantic":[81],"structural":[83],"similarity":[84],"between":[85],"certain":[86],"classes,":[88],"propose":[90],"class":[92],"merging":[93],"strategy":[94],"that":[95],"combines":[96],"highly":[97],"similar":[98],"actions":[99],"into":[100],"unified":[101],"categories.":[102],"This":[103],"not":[104],"only":[105],"simplifies":[106],"classification":[108],"task,":[109],"but":[110],"also":[111],"improves":[112],"overall":[113],"performance":[115],"reducing":[117],"ambiguity.":[118],"Experimental":[119],"results":[120],"demonstrate":[121],"effectiveness":[123],"Transformers":[125],"for":[126],"settings,":[132],"highlighting":[133],"importance":[135],"both":[137],"architectural":[138],"tuning":[139],"label":[141],"refinement":[142],"when":[143],"dealing":[144],"with":[145],"closely":[146],"related":[147]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-06T00:00:00"}
