{"id":"https://openalex.org/W2003862906","doi":"https://doi.org/10.1109/roman.2007.4415073","title":"Hand Gesture Recognition To Understand Musical Conducting Action","display_name":"Hand Gesture Recognition To Understand Musical Conducting Action","publication_year":2007,"publication_date":"2007-01-01","ids":{"openalex":"https://openalex.org/W2003862906","doi":"https://doi.org/10.1109/roman.2007.4415073","mag":"2003862906"},"language":"en","primary_location":{"id":"doi:10.1109/roman.2007.4415073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/roman.2007.4415073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"RO-MAN 2007 - The 16th IEEE International Symposium on Robot and Human Interactive Communication","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009941021","display_name":"Hong-Mo Je","orcid":null},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hongmo Je","raw_affiliation_strings":["Intelligent Multimedia Laboratory, Department of Computer Science & Engineering, Pohang University of Science and Technology, Pohang, South Korea","Pohang Univ. of Sci. & Technol., Pohang#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Multimedia Laboratory, Department of Computer Science & Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]},{"raw_affiliation_string":"Pohang Univ. of Sci. & Technol., Pohang#TAB#","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088953139","display_name":"Jiman Kim","orcid":"https://orcid.org/0000-0002-9929-5499"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jiman Kim","raw_affiliation_strings":["Intelligent Multimedia Laboratory, Department of Computer Science & Engineering, Pohang University of Science and Technology, Pohang, South Korea","Pohang Univ. of Sci. & Technol., Pohang#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Multimedia Laboratory, Department of Computer Science & Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]},{"raw_affiliation_string":"Pohang Univ. of Sci. & Technol., Pohang#TAB#","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101431617","display_name":"Daijin Kim","orcid":"https://orcid.org/0000-0002-8046-8521"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Daijin Kim","raw_affiliation_strings":["Intelligent Multimedia Laboratory, Department of Computer Science & Engineering, Pohang University of Science and Technology, Pohang, South Korea","Pohang Univ. of Sci. & Technol., Pohang#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Multimedia Laboratory, Department of Computer Science & Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]},{"raw_affiliation_string":"Pohang Univ. of Sci. & Technol., Pohang#TAB#","institution_ids":["https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.5026,"has_fulltext":false,"cited_by_count":32,"citation_normalized_percentile":{"value":0.88479178,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"163","last_page":"168"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11285","display_name":"Hearing Impairment and Communication","score":0.9832000136375427,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7730116248130798},{"id":"https://openalex.org/keywords/gesture-recognition","display_name":"Gesture recognition","score":0.7637643814086914},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7309752702713013},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7073652148246765},{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.5981519818305969},{"id":"https://openalex.org/keywords/histogram","display_name":"Histogram","score":0.5881214737892151},{"id":"https://openalex.org/keywords/match-moving","display_name":"Match moving","score":0.5152595043182373},{"id":"https://openalex.org/keywords/template-matching","display_name":"Template matching","score":0.4257269501686096},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4175077974796295},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.34724047780036926},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08585697412490845}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7730116248130798},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.7637643814086914},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7309752702713013},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7073652148246765},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.5981519818305969},{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.5881214737892151},{"id":"https://openalex.org/C95020103","wikidata":"https://www.wikidata.org/wiki/Q1813492","display_name":"Match moving","level":3,"score":0.5152595043182373},{"id":"https://openalex.org/C158096908","wikidata":"https://www.wikidata.org/wiki/Q3983303","display_name":"Template matching","level":3,"score":0.4257269501686096},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4175077974796295},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.34724047780036926},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08585697412490845}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/roman.2007.4415073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/roman.2007.4415073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"RO-MAN 2007 - The 16th IEEE International Symposium on Robot and Human Interactive Communication","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W6854706","https://openalex.org/W175773053","https://openalex.org/W1595932190","https://openalex.org/W1971544888","https://openalex.org/W1982439832","https://openalex.org/W2057312772","https://openalex.org/W2110838840","https://openalex.org/W2111578598","https://openalex.org/W2155958158","https://openalex.org/W2161616933","https://openalex.org/W4245301227","https://openalex.org/W4285719527","https://openalex.org/W6607065525","https://openalex.org/W6640164134","https://openalex.org/W6664802581","https://openalex.org/W6676514092"],"related_works":["https://openalex.org/W2902873204","https://openalex.org/W2185750513","https://openalex.org/W2010878661","https://openalex.org/W3147379364","https://openalex.org/W2026258298","https://openalex.org/W3204639664","https://openalex.org/W2970836791","https://openalex.org/W2805039731","https://openalex.org/W2989699735","https://openalex.org/W2299204920"],"abstract_inverted_index":{"This":[0],"paper":[1],"deals":[2],"with":[3,44],"the":[4,33,75,80,84,100,106,119,122,125,128,134,141,146,151,157,175,187,192],"understanding":[5],"of":[6,21,27,113,121,124,127,150],"four":[7],"musical":[8,176],"time":[9,177],"patterns":[10],"and":[11,61,68,83,132,140,154,179],"three":[12],"tempos":[13],"that":[14,174],"are":[15,183],"generated":[16,109],"by":[17,104,110,156],"a":[18,40,66],"human":[19,101],"conductor":[20],"robot":[22],"orchestra":[23],"or":[24,166],"an":[25],"operator":[26],"computer-based":[28],"music":[29],"play":[30],"system":[31,93],"using":[32,74,162],"hand":[34,71,90,102,130,159],"gesture":[35,72,91,135,160],"recognition.":[36],"We":[37,64],"use":[38],"only":[39],"stereo":[41,111],"vision":[42],"camera":[43],"no":[45],"extra":[46],"special":[47],"devices":[48],"such":[49,137],"as":[50,95,138],"sensor":[51],"glove,":[52],"3D":[53],"motion":[54,85,120,167,193],"capture":[55],"system,":[56],"infra-red":[57],"camera,":[58],"electronic":[59],"baton":[60],"so":[62],"on.":[63],"propose":[65],"simple":[67],"reliable":[69],"vision-based":[70],"recognition":[73,92,161,181],"conducting":[76],"feature":[77],"point":[78],"(CFP),":[79],"motion-direction":[81],"code,":[82],"history":[86],"matching.":[87,169],"The":[88,170],"proposed":[89,158],"operates":[94],"follows:":[96],"First,":[97],"it":[98,117],"extracts":[99],"region":[103,131],"segmenting":[105],"depth":[107],"information":[108],"matching":[112,195],"image":[114],"sequences.":[115],"Next,":[116],"follows":[118],"center":[123],"gravity(COG)":[126],"extracted":[129],"generates":[133],"features":[136],"CFP":[139,164],"direction-code.":[142],"Finally,":[143],"we":[144],"obtain":[145],"current":[147],"timing":[148],"pattern":[149,178],"music's":[152],"beat":[153],"tempo":[155,180],"either":[163],"tracking":[165],"histogram":[168,194],"experimental":[171],"results":[172],"show":[173],"rate":[182],"over":[184],"86%":[185],"on":[186],"test":[188],"data":[189],"set":[190],"when":[191],"is":[196],"used.":[197]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
