{"id":"https://openalex.org/W4402352210","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651436","title":"Intuitive UAV Operation: A Novel Dataset and Benchmark for Multi-Distance Gesture Recognition","display_name":"Intuitive UAV Operation: A Novel Dataset and Benchmark for Multi-Distance Gesture Recognition","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402352210","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651436"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10651436","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651436","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100573475","display_name":"Zhenpeng Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhenpeng Xu","raw_affiliation_strings":["Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100562876","display_name":"Pan Sun","orcid":"https://orcid.org/0009-0003-6188-7880"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pan Sun","raw_affiliation_strings":["Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102765121","display_name":"Lu Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Lu","raw_affiliation_strings":["Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016399027","display_name":"Huilin Ge","orcid":"https://orcid.org/0000-0001-9175-5668"},"institutions":[{"id":"https://openalex.org/I4210096899","display_name":"Jiangsu University of Science and Technology","ror":"https://ror.org/00tyjp878","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210096899"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huilin Ge","raw_affiliation_strings":["Jiangsu University Science and Technology,College of Automation,Zhenjiang,China"],"affiliations":[{"raw_affiliation_string":"Jiangsu University Science and Technology,College of Automation,Zhenjiang,China","institution_ids":["https://openalex.org/I4210096899"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100457578","display_name":"Meng Li","orcid":"https://orcid.org/0000-0003-4069-2665"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Li","raw_affiliation_strings":["Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065242276","display_name":"Yingjian Qi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingjian Qi","raw_affiliation_strings":["Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Technology University,College of Big Data and Internet,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100573475"],"corresponding_institution_ids":["https://openalex.org/I4210152380"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14498537,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7935519218444824},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7462195754051208},{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.71977698802948},{"id":"https://openalex.org/keywords/gesture-recognition","display_name":"Gesture recognition","score":0.6087862253189087},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5698395371437073},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4610634744167328},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3790265917778015},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.36647260189056396},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.07125794887542725},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.05647304654121399}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7935519218444824},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7462195754051208},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.71977698802948},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.6087862253189087},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5698395371437073},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4610634744167328},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3790265917778015},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.36647260189056396},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.07125794887542725},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.05647304654121399}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10651436","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651436","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2766464167","https://openalex.org/W2801265513","https://openalex.org/W2911055311","https://openalex.org/W2944114271","https://openalex.org/W2947489306","https://openalex.org/W2963037989","https://openalex.org/W2963163009","https://openalex.org/W2972464629","https://openalex.org/W2974047772","https://openalex.org/W2987322373","https://openalex.org/W3005863531","https://openalex.org/W3034390870","https://openalex.org/W3097222248","https://openalex.org/W3108204456","https://openalex.org/W3136257968","https://openalex.org/W3184439416","https://openalex.org/W3199384980","https://openalex.org/W3200751609","https://openalex.org/W3204763521","https://openalex.org/W3205866076","https://openalex.org/W3210179512","https://openalex.org/W4205438624","https://openalex.org/W4213126844","https://openalex.org/W4288054297","https://openalex.org/W4289752563","https://openalex.org/W4294068646","https://openalex.org/W4307937951","https://openalex.org/W4313141308","https://openalex.org/W4313197164","https://openalex.org/W4319027078","https://openalex.org/W4323572372","https://openalex.org/W4324095563","https://openalex.org/W4327652243","https://openalex.org/W4367682399","https://openalex.org/W4382630561","https://openalex.org/W4385482832","https://openalex.org/W4386076325","https://openalex.org/W4386222389","https://openalex.org/W4387059420","https://openalex.org/W4389045162","https://openalex.org/W6620707391","https://openalex.org/W6798838024"],"related_works":["https://openalex.org/W2902873204","https://openalex.org/W2185750513","https://openalex.org/W2010878661","https://openalex.org/W3147379364","https://openalex.org/W2026258298","https://openalex.org/W3204639664","https://openalex.org/W2970836791","https://openalex.org/W2805039731","https://openalex.org/W2989699735","https://openalex.org/W4322710567"],"abstract_inverted_index":{"UAV":[0,28,43,74,84,102],"gesture":[1,29,45,75,85,92],"recognition,":[2],"a":[3,21,41,55,70,82,140,153,158,187],"novel":[4],"human-computer":[5],"interaction":[6],"form,":[7],"offers":[8],"an":[9],"intuitive":[10],"approach":[11],"to":[12,68],"controlling":[13],"UAVs":[14],"in":[15,34,60,73,104,142,189],"various":[16],"environments.":[17],"However,":[18],"there":[19],"is":[20,66],"lack":[22],"of":[23,58,133],"comprehensive":[24],"datasets":[25],"for":[26],"AI-powered":[27],"recognition.":[30],"This":[31,64],"paper":[32],"contributes":[33],"several":[35],"ways:":[36],"(i)":[37],"We":[38,79],"introduce":[39],"MD-UHGRD,":[40],"unique":[42],"static":[44],"dataset":[46,65],"with":[47,119,164],"20,":[48],"000":[49],"images":[50],"and":[51,98,126,152,168,192,196],"annotations,":[52],"collected":[53],"from":[54],"diverse":[56],"group":[57],"participants":[59],"different":[61],"environmental":[62],"conditions.":[63],"expected":[67],"bridge":[69],"significant":[71],"gap":[72],"recognition":[76,86,93],"algorithms.":[77],"(ii)":[78],"propose":[80],"SA-YOLO,":[81],"multifunctional":[83],"method":[87,146],"that":[88],"not":[89,178],"only":[90,179],"enables":[91],"but":[94,184],"also":[95,185],"includes":[96],"face":[97],"pedestrian":[99],"tracking,":[100],"optimizing":[101],"control":[103],"complex":[105],"scenarios.":[106],"SA-YOLO":[107,177],"incorporates":[108],"the":[109,181],"Spatial":[110],"Asymptotic":[111],"Feature":[112],"Pyramid":[113,117],"Network":[114],"(SAFPN),":[115],"Scale":[116],"Pooling":[118],"Cross":[120],"Stage":[121],"Partial":[122],"Networks":[123],"Convolution":[124,128],"(SPPCSPC),":[125],"Space-to-Depth":[127],"(SPD-Conv).":[129],"(iii)":[130],"Extensive":[131],"evaluation":[132],"SAYOLO":[134],"on":[135],"MD-UHGRD":[136],"establishes":[137],"it":[138],"as":[139],"benchmark":[141],"this":[143],"domain.":[144],"Our":[145],"demonstrates":[147],"high":[148],"accuracy,":[149],"processing":[150],"speed,":[151],"compact":[154],"model":[155,190],"size,":[156],"achieving":[157],"93.2%":[159],"mean":[160],"Average":[161],"Precision":[162],"(mAP)":[163],"10.3":[165],"million":[166],"parameters":[167],"48":[169],"frames":[170],"per":[171],"second":[172],"(FPS).":[173],"Among":[174],"competing":[175],"models,":[176],"achieves":[180],"highest":[182],"mAP":[183],"maintains":[186],"balance":[188],"size":[191],"FPS.":[193],"The":[194],"database":[195],"code":[197],"are":[198],"available":[199],"at:":[200],"https://github.com/ijcnn2024/SA-YOLO.":[201]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
