{"id":"https://openalex.org/W4313173527","doi":"https://doi.org/10.1109/mmsp55362.2022.9948897","title":"Hand-object Interaction based Semi-automatic Objects Annotation for Human Activity Datasets","display_name":"Hand-object Interaction based Semi-automatic Objects Annotation for Human Activity Datasets","publication_year":2022,"publication_date":"2022-09-26","ids":{"openalex":"https://openalex.org/W4313173527","doi":"https://doi.org/10.1109/mmsp55362.2022.9948897"},"language":"en","primary_location":{"id":"doi:10.1109/mmsp55362.2022.9948897","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmsp55362.2022.9948897","pdf_url":null,"source":{"id":"https://openalex.org/S4363605768","display_name":"2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100370856","display_name":"Yuankai Wu","orcid":"https://orcid.org/0000-0003-4435-9413"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Yuankai Wu","raw_affiliation_strings":["Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032513259","display_name":"Zhouyi Gu","orcid":null},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Zhouyi Gu","raw_affiliation_strings":["Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023180222","display_name":"Marsil Zakour","orcid":"https://orcid.org/0000-0003-1319-9912"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marsil Zakour","raw_affiliation_strings":["Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083505379","display_name":"Rahul Chaudhari","orcid":"https://orcid.org/0000-0003-0400-428X"},"institutions":[{"id":"https://openalex.org/I62916508","display_name":"Technical University of Munich","ror":"https://ror.org/02kkvpp62","country_code":"DE","type":"education","lineage":["https://openalex.org/I62916508"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Rahul Gopal Chaudhari","raw_affiliation_strings":["Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich,Munich,Germany","institution_ids":["https://openalex.org/I62916508"]},{"raw_affiliation_string":"Chair of Media Technology and Munich Institute of Robotics and Machine Intelligence, Technical University of Munich, Munich, Germany","institution_ids":["https://openalex.org/I62916508"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100370856"],"corresponding_institution_ids":["https://openalex.org/I62916508"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16891412,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8327293992042542},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7484955787658691},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6334733963012695},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6231070160865784},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6172745227813721},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5310022830963135},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.5180826187133789},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.46600088477134705},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.41742801666259766},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.34076815843582153}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8327293992042542},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7484955787658691},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6334733963012695},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6231070160865784},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6172745227813721},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5310022830963135},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.5180826187133789},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.46600088477134705},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.41742801666259766},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34076815843582153},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/mmsp55362.2022.9948897","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmsp55362.2022.9948897","pdf_url":null,"source":{"id":"https://openalex.org/S4363605768","display_name":"2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:mediatum.ub.tum.de:node/1689174","is_oa":false,"landing_page_url":"https://mediatum.ub.tum.de/1689174","pdf_url":null,"source":{"id":"https://openalex.org/S4377196330","display_name":"mediaTUM  (Technical University of Munich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I62916508","host_organization_name":"Technical University of Munich","host_organization_lineage":["https://openalex.org/I62916508"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"ConferencePaper"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6000000238418579,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1861492603","https://openalex.org/W2021896843","https://openalex.org/W2031489346","https://openalex.org/W2150066425","https://openalex.org/W2292288263","https://openalex.org/W2337252826","https://openalex.org/W2527081555","https://openalex.org/W2601564443","https://openalex.org/W2883697687","https://openalex.org/W2888096830","https://openalex.org/W2896659472","https://openalex.org/W2962730651","https://openalex.org/W2963091558","https://openalex.org/W2963150697","https://openalex.org/W2963223499","https://openalex.org/W2963227409","https://openalex.org/W2963722382","https://openalex.org/W2964225075","https://openalex.org/W2981773282","https://openalex.org/W3005170598","https://openalex.org/W3034278117","https://openalex.org/W3034679267","https://openalex.org/W3034891989","https://openalex.org/W3116259331","https://openalex.org/W3179066717","https://openalex.org/W4293584584","https://openalex.org/W4312446811","https://openalex.org/W6639102338","https://openalex.org/W6750227808"],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2218034408","https://openalex.org/W2392921965","https://openalex.org/W2358755282","https://openalex.org/W2625833328","https://openalex.org/W1533177136","https://openalex.org/W4292830139","https://openalex.org/W4319309705"],"abstract_inverted_index":{"Objects":[0],"annotation":[1,166,185],"is":[2,29,67],"a":[3,20,30,86,134],"prerequisite":[4],"for":[5,137],"learning-based":[6],"detectors":[7],"to":[8,23,70,92,111],"locate":[9],"and":[10,36,119,182],"extract":[11],"object":[12,74,116,142],"semantic":[13,62],"information":[14],"from":[15],"the":[16,47,71,77,102,106,109,112,115,121,124,153,162,177],"scene.":[17],"This":[18,66,175],"provides":[19],"significant":[21],"contribution":[22],"human":[24],"activity":[25],"recognition":[26],"(HAR),":[27],"which":[28],"core":[31],"study":[32],"in":[33,76,96],"computer":[34],"vision":[35],"assistive":[37],"robotics":[38],"area.":[39],"The":[40,98],"current":[41,78],"dominant":[42],"HAR":[43,79],"approaches":[44],"focus":[45],"on":[46,152],"end-to-end":[48],"model":[49],"using":[50,61],"RGB":[51],"images":[52],"or":[53],"optical":[54],"flow":[55],"stream":[56],"as":[57],"input":[58],"rather":[59],"than":[60],"human-object":[63],"interaction":[64,89],"information.":[65],"mainly":[68],"due":[69],"lacking":[72],"of":[73,108,114,173],"annotations":[75,138],"datasets.":[80],"To":[81],"this":[82],"end,":[83],"we":[84],"propose":[85],"novel":[87],"hand-object":[88],"based":[90],"approach":[91,100,131],"semi-automatic":[93],"annotating":[94,146],"objects":[95,103,147,165],"videos.":[97],"proposed":[99],"annotates":[101],"by":[104,180,187],"mapping":[105],"trajectories":[107,113],"hands":[110],"bounding":[117],"boxes,":[118],"smoothen":[120],"track":[122],"with":[123,161],"Kalman":[125],"filter.":[126],"Unlike":[127],"existing":[128],"methods,":[129],"our":[130],"requires":[132],"only":[133],"few":[135],"clicks":[136],"without":[139],"fine-tuning":[140],"any":[141],"detection":[143],"models":[144],"after":[145],"manually.":[148],"Our":[149],"experimental":[150],"results":[151],"Bimanual":[154],"Actions":[155],"Dataset":[156],"achieve":[157],"78.81%":[158],"accuracy":[159],"compared":[160],"ground":[163],"truth":[164],"at":[167],"an":[168],"intersection":[169],"over":[170],"union":[171],"(IoU)":[172],"0.5.":[174],"outperforms":[176],"state-of-the-art":[178],"tracker":[179],"7.15%,":[181],"reduces":[183],"manual":[184],"workload":[186],"92.86%.":[188]},"counts_by_year":[],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
