{"id":"https://openalex.org/W4400527593","doi":"https://doi.org/10.1109/fg59268.2024.10582035","title":"In My Perspective, in My Hands: Accurate Egocentric 2D Hand Pose and Action Recognition","display_name":"In My Perspective, in My Hands: Accurate Egocentric 2D Hand Pose and Action Recognition","publication_year":2024,"publication_date":"2024-05-27","ids":{"openalex":"https://openalex.org/W4400527593","doi":"https://doi.org/10.1109/fg59268.2024.10582035"},"language":"en","primary_location":{"id":"doi:10.1109/fg59268.2024.10582035","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fg59268.2024.10582035","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 18th International Conference on Automatic Face and Gesture Recognition (FG)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020545449","display_name":"Wiktor Mucha","orcid":"https://orcid.org/0000-0002-6048-3425"},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Wiktor Mucha","raw_affiliation_strings":["TU Wien,Computer Vision Lab,Vienna,Austria,1040"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TU Wien,Computer Vision Lab,Vienna,Austria,1040","institution_ids":["https://openalex.org/I145847075"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081324708","display_name":"Martin Kampel","orcid":"https://orcid.org/0000-0002-5217-2854"},"institutions":[{"id":"https://openalex.org/I145847075","display_name":"TU Wien","ror":"https://ror.org/04d836q62","country_code":"AT","type":"education","lineage":["https://openalex.org/I145847075"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Martin Kampel","raw_affiliation_strings":["TU Wien,Computer Vision Lab,Vienna,Austria,1040"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TU Wien,Computer Vision Lab,Vienna,Austria,1040","institution_ids":["https://openalex.org/I145847075"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.4997,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.93910163,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.972000002861023,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11431","display_name":"Action Observation and Synchronization","score":0.960099995136261,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.7267037630081177},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6691815853118896},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.6565901041030884},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5979688167572021},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5206239223480225},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5098609328269958},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5075639486312866},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.43000033497810364}],"concepts":[{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.7267037630081177},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6691815853118896},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.6565901041030884},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5979688167572021},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5206239223480225},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5098609328269958},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5075639486312866},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.43000033497810364},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/fg59268.2024.10582035","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fg59268.2024.10582035","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 18th International Conference on Automatic Face and Gesture Recognition (FG)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G935321560","display_name":"Algorithmic governance of care","funder_award_id":"ICT20-055","funder_id":"https://openalex.org/F4320321003","funder_display_name":"Vienna Science and Technology Fund"}],"funders":[{"id":"https://openalex.org/F4320321003","display_name":"Vienna Science and Technology Fund","ror":"https://ror.org/01f9mc681"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2149537132","https://openalex.org/W2018871932","https://openalex.org/W2123263858","https://openalex.org/W641279757","https://openalex.org/W370975646","https://openalex.org/W1670566515","https://openalex.org/W3127959533","https://openalex.org/W1576128429","https://openalex.org/W3135266094","https://openalex.org/W2269464716"],"abstract_inverted_index":{"Action":[0],"recognition":[1,146,162],"is":[2,202,234],"essential":[3],"for":[4,55,93,106,113,119,206],"egocentric":[5,56,94,121,207],"video":[6],"understanding,":[7],"allowing":[8],"automatic":[9],"and":[10,116,127,136,151,158,167,177,183,212,224],"continuous":[11],"monitoring":[12],"of":[13,15,62,70,88,181,188,218],"Activities":[14],"Daily":[16],"Living":[17],"(ADLs)":[18],"without":[19],"user":[20],"effort.":[21],"Existing":[22],"literature":[23],"focuses":[24],"on":[25,134,165],"3D":[26],"hand":[27,53,90,108,150,220],"pose":[28,54,91,109,221],"input,":[29],"which":[30],"requires":[31],"computationally":[32],"intensive":[33],"depth":[34,41],"estimation":[35,92,115,222],"networks":[36],"or":[37],"wearing":[38],"an":[39,120,179],"uncomfortable":[40],"sensor.":[42],"In":[43],"contrast,":[44],"there":[45],"has":[46,172],"been":[47],"insufficient":[48],"research":[49,82],"in":[50,66],"understanding":[51],"2D":[52,89,107,149,199],"action":[57,95,145,161,208],"recognition,":[58,96],"despite":[59],"the":[60,67,86,189,216,219,229],"availability":[61],"user-friendly":[63],"smart":[64],"glasses":[65],"market":[68],"capable":[69],"capturing":[71,123],"a":[72,143,159,173,203],"single":[73],"RGB":[74],"image.":[75],"Our":[76,194],"study":[77],"aims":[78],"to":[79],"fill":[80],"this":[81],"gap":[83],"by":[84],"exploring":[85],"field":[87],"making":[97],"two":[98,103],"contributions.":[99],"Firstly,":[100],"we":[101,141],"introduce":[102],"novel":[104],"approaches":[105],"estimation,":[110],"namely":[111],"EffHandNet":[112],"single-hand":[114],"EffHandEgoNet,":[117,157],"tailored":[118],"perspective,":[122],"interactions":[124],"between":[125],"hands":[126],"objects.":[128],"Both":[129],"methods":[130],"outperform":[131],"state-of-the-art":[132],"models":[133],"H2O":[135,166],"FPHA":[137,168],"public":[138],"benchmarks.":[139],"Secondly,":[140],"present":[142],"robust":[144,204],"architecture":[147,171],"from":[148],"object":[152],"poses.":[153],"This":[154],"method":[155],"incorporates":[156],"transformer-based":[160],"method.":[163],"Evaluated":[164],"datasets,":[169],"our":[170],"faster":[174],"inference":[175],"time":[176],"achieves":[178],"accuracy":[180],"91.32%":[182],"94.43%,":[184],"respectively,":[185],"surpassing":[186],"state":[187],"art,":[190],"including":[191],"3D-based":[192],"methods.":[193],"work":[195],"demonstrates":[196],"that":[197],"using":[198],"skeletal":[200],"data":[201],"approach":[205],"understanding.":[209],"Extensive":[210],"evaluation":[211],"ablation":[213],"studies":[214],"show":[215],"impact":[217],"approach,":[223],"how":[225],"each":[226],"input":[227],"affects":[228],"overall":[230],"performance.":[231],"The":[232],"code":[233],"available":[235],"at":[236],"https://github.com/wiktormucha/effhandegonet.":[237]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
