{"id":"https://openalex.org/W3134676920","doi":"https://doi.org/10.1109/iros51168.2021.9636578","title":"Domain Adaptive Robotic Gesture Recognition with Unsupervised Kinematic-Visual Data Alignment","display_name":"Domain Adaptive Robotic Gesture Recognition with Unsupervised Kinematic-Visual Data Alignment","publication_year":2021,"publication_date":"2021-09-27","ids":{"openalex":"https://openalex.org/W3134676920","doi":"https://doi.org/10.1109/iros51168.2021.9636578","mag":"3134676920"},"language":"en","primary_location":{"id":"doi:10.1109/iros51168.2021.9636578","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros51168.2021.9636578","pdf_url":null,"source":{"id":"https://openalex.org/S4363607734","display_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044777574","display_name":"Xueying Shi","orcid":"https://orcid.org/0000-0003-0384-560X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xueying Shi","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050163233","display_name":"Yueming Jin","orcid":"https://orcid.org/0000-0003-3775-3877"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yueming Jin","raw_affiliation_strings":["The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090516040","display_name":"Qi Dou","orcid":"https://orcid.org/0000-0002-3416-9950"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Dou","raw_affiliation_strings":["T Stone Robotics Institute, The Chinese University of Hong Kong","The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"T Stone Robotics Institute, The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100662807","display_name":"Jing Qin","orcid":"https://orcid.org/0000-0002-7059-0929"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jing Qin","raw_affiliation_strings":["Centre for Smart Health, School of Nursing, The Hong Kong Polytechnic University"],"affiliations":[{"raw_affiliation_string":"Centre for Smart Health, School of Nursing, The Hong Kong Polytechnic University","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032708386","display_name":"Pheng\u2010Ann Heng","orcid":"https://orcid.org/0000-0003-3055-5034"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pheng-Ann Heng","raw_affiliation_strings":["Guangdong-Hong Kong-Macao Joint Laboratory of Human-Machine Intelligence-Synergy Systems, Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, China","T Stone Robotics Institute, The Chinese University of Hong Kong","The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Guangdong-Hong Kong-Macao Joint Laboratory of Human-Machine Intelligence-Synergy Systems, Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, China","institution_ids":["https://openalex.org/I4210145761"]},{"raw_affiliation_string":"T Stone Robotics Institute, The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5044777574"],"corresponding_institution_ids":["https://openalex.org/I177725633"],"apc_list":null,"apc_paid":null,"fwci":0.196,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.54565092,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"9453","last_page":"9460"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.7549073696136475},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.743238627910614},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7039071321487427},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5819201469421387},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5815407633781433},{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.5145889520645142},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5006616115570068},{"id":"https://openalex.org/keywords/gesture-recognition","display_name":"Gesture recognition","score":0.44792577624320984},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4430631101131439},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.43889957666397095},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.43216073513031006},{"id":"https://openalex.org/keywords/robot-kinematics","display_name":"Robot kinematics","score":0.4261455237865448},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35900282859802246},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.1917855441570282},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.10195925831794739}],"concepts":[{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.7549073696136475},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.743238627910614},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7039071321487427},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5819201469421387},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5815407633781433},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.5145889520645142},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5006616115570068},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.44792577624320984},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4430631101131439},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.43889957666397095},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.43216073513031006},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.4261455237865448},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35900282859802246},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.1917855441570282},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.10195925831794739},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros51168.2021.9636578","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros51168.2021.9636578","pdf_url":null,"source":{"id":"https://openalex.org/S4363607734","display_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1584687743","https://openalex.org/W1882958252","https://openalex.org/W1953678742","https://openalex.org/W2013293242","https://openalex.org/W2194775991","https://openalex.org/W2413983136","https://openalex.org/W2513058035","https://openalex.org/W2568518337","https://openalex.org/W2598070036","https://openalex.org/W2605102758","https://openalex.org/W2770804203","https://openalex.org/W2777273430","https://openalex.org/W2793888044","https://openalex.org/W2962687275","https://openalex.org/W2963826681","https://openalex.org/W2987427063","https://openalex.org/W2998446648","https://openalex.org/W2998770346","https://openalex.org/W3003853839","https://openalex.org/W3034972874","https://openalex.org/W3090743551","https://openalex.org/W3090913119","https://openalex.org/W3091747220","https://openalex.org/W3092022161","https://openalex.org/W3096667748","https://openalex.org/W3150630416","https://openalex.org/W3194032101","https://openalex.org/W4212965831","https://openalex.org/W6639480849","https://openalex.org/W6800317752"],"related_works":["https://openalex.org/W2902873204","https://openalex.org/W2185750513","https://openalex.org/W2010878661","https://openalex.org/W3147379364","https://openalex.org/W2026258298","https://openalex.org/W3204639664","https://openalex.org/W2970836791","https://openalex.org/W2805039731","https://openalex.org/W2989699735","https://openalex.org/W2331850854"],"abstract_inverted_index":{"Automated":[0],"surgical":[1],"gesture":[2,183],"recognition":[3,184],"is":[4],"of":[5,145,161],"great":[6,201],"importance":[7],"in":[8,86,91,207,211,217],"robot-assisted":[9],"minimally":[10],"invasive":[11],"surgery.":[12],"However,":[13],"existing":[14],"methods":[15],"assume":[16],"that":[17,194],"training":[18],"and":[19,42,65,88,135,147,209],"testing":[20],"data":[21],"are":[22,155],"from":[23,29,68],"the":[24,40,75,127,142,162,169,173,198],"same":[25],"domain,":[26],"which":[27,56,111],"suffers":[28],"severe":[30],"performance":[31,199],"degradation":[32],"when":[33],"a":[34,50,100,133],"domain":[35,53,76],"gap":[36,77,121],"exists,":[37],"such":[38],"as":[39],"simulator":[41,69],"real":[43,71,218],"robot.":[44,72,219],"In":[45],"this":[46],"paper,":[47],"we":[48,97,131],"propose":[49,99,132],"novel":[51],"unsupervised":[52],"adaptation":[54,128],"framework":[55],"can":[57],"simultaneously":[58],"transfer":[59,116,141,190],"multi-modality":[60],"knowledge,":[61],"i.e.,":[62],"both":[63],"kinematic":[64],"visual":[66],"data,":[67],"to":[70,108,115,140,205],"It":[73],"remedies":[74],"with":[78,119,188,200],"enhanced":[79],"transferable":[80],"features":[81,150],"by":[82,152],"using":[83,185,214],"temporal":[84,113],"cues":[85],"videos,":[87],"inherent":[89],"correlations":[90],"multi-modal":[92],"towards":[93],"recognizing":[94],"gesture.":[95],"Specifically,":[96],"first":[98],"Motion":[101],"Direction":[102],"Oriented":[103],"Kinematics":[104],"feature":[105,165],"alignment":[106,166],"(MDO-K)":[107],"align":[109],"kinematics,":[110],"exploits":[112],"continuity":[114],"motion":[117],"directions":[118],"smaller":[120],"rather":[122],"than":[123],"position":[124],"values,":[125],"relieving":[126],"burden.":[129],"Moreover,":[130],"Kinematic":[134],"Visual":[136],"Relation":[137],"Attention":[138],"(KV-Relation-ATT)":[139],"co-occurrence":[143],"signals":[144],"kinematics":[146],"vision.":[148],"Such":[149],"attended":[151],"correlation":[153],"similarity":[154],"more":[156],"informative":[157],"for":[158,182],"enhancing":[159],"domain-irreverent":[160],"model.":[163],"Two":[164],"strategies":[167],"benefit":[168],"model":[170],"mutually":[171],"during":[172],"end-to-end":[174],"learning":[175],"process.":[176],"We":[177],"extensively":[178],"evaluate":[179],"our":[180,195],"method":[181],"DESK":[186],"dataset":[187],"peg":[189],"procedure.":[191],"Results":[192],"show":[193],"approach":[196],"recovers":[197],"improvement":[202],"gains,":[203],"up":[204],"12.91%":[206],"Accuracy":[208],"20.16%":[210],"F1score":[212],"without":[213],"any":[215],"annotations":[216]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
