{"id":"https://openalex.org/W7125955365","doi":"https://doi.org/10.1109/smc58881.2025.11342598","title":"AirVista-II: An Agentic System for Embodied UAVs Toward Dynamic Scene Semantic Understanding","display_name":"AirVista-II: An Agentic System for Embodied UAVs Toward Dynamic Scene Semantic Understanding","publication_year":2025,"publication_date":"2025-10-05","ids":{"openalex":"https://openalex.org/W7125955365","doi":"https://doi.org/10.1109/smc58881.2025.11342598"},"language":null,"primary_location":{"id":"doi:10.1109/smc58881.2025.11342598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342598","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124137974","display_name":"Fei Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I111950717","display_name":"Macau University of Science and Technology","ror":"https://ror.org/03jqs2n27","country_code":"MO","type":"education","lineage":["https://openalex.org/I111950717","https://openalex.org/I4391767947"]}],"countries":["MO"],"is_corresponding":true,"raw_author_name":"Fei Lin","raw_affiliation_strings":["Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078"],"affiliations":[{"raw_affiliation_string":"Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078","institution_ids":["https://openalex.org/I111950717"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115594196","display_name":"Yonglin Tian","orcid":"https://orcid.org/0009-0005-4035-7332"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yonglin Tian","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences,State Key Laboratory for Management and Control of Complex Systems,Beijing,China,100190"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences,State Key Laboratory for Management and Control of Complex Systems,Beijing,China,100190","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078400575","display_name":"Tengchao Zhang","orcid":"https://orcid.org/0000-0003-1730-4185"},"institutions":[{"id":"https://openalex.org/I111950717","display_name":"Macau University of Science and Technology","ror":"https://ror.org/03jqs2n27","country_code":"MO","type":"education","lineage":["https://openalex.org/I111950717","https://openalex.org/I4391767947"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Tengchao Zhang","raw_affiliation_strings":["Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078"],"affiliations":[{"raw_affiliation_string":"Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078","institution_ids":["https://openalex.org/I111950717"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101488477","display_name":"Jun Huang","orcid":"https://orcid.org/0009-0007-3883-4106"},"institutions":[{"id":"https://openalex.org/I111950717","display_name":"Macau University of Science and Technology","ror":"https://ror.org/03jqs2n27","country_code":"MO","type":"education","lineage":["https://openalex.org/I111950717","https://openalex.org/I4391767947"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Jun Huang","raw_affiliation_strings":["Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078"],"affiliations":[{"raw_affiliation_string":"Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078","institution_ids":["https://openalex.org/I111950717"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043826183","display_name":"Sangtian Guan","orcid":"https://orcid.org/0009-0006-9743-3559"},"institutions":[{"id":"https://openalex.org/I111950717","display_name":"Macau University of Science and Technology","ror":"https://ror.org/03jqs2n27","country_code":"MO","type":"education","lineage":["https://openalex.org/I111950717","https://openalex.org/I4391767947"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Sangtian Guan","raw_affiliation_strings":["Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078"],"affiliations":[{"raw_affiliation_string":"Faculty of Innovation Engineering, Macau University of Science and Technology,Department of Engineering Science,Macau,China,999078","institution_ids":["https://openalex.org/I111950717"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124073021","display_name":"Fei-Yue Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei-Yue Wang","raw_affiliation_strings":["Chinese Academy of Sciences,State Key Laboratory for Management and Control of Complex Systems,Beijing,100190"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,State Key Laboratory for Management and Control of Complex Systems,Beijing,100190","institution_ids":["https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5124137974"],"corresponding_institution_ids":["https://openalex.org/I111950717"],"apc_list":null,"apc_paid":null,"fwci":2.4362,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.91430109,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"6319","last_page":"6324"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.599399983882904,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.599399983882904,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.09179999679327011,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.0471000000834465,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.7042999863624573},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5996000170707703},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5759999752044678},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5016000270843506},{"id":"https://openalex.org/keywords/mode","display_name":"Mode (computer interface)","score":0.44929999113082886},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.387800008058548},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.37389999628067017}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7226999998092651},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.7042999863624573},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5996000170707703},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5759999752044678},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.516700029373169},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5016000270843506},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.44929999113082886},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4106000065803528},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.387800008058548},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.37389999628067017},{"id":"https://openalex.org/C3018653863","wikidata":"https://www.wikidata.org/wiki/Q5281355","display_name":"Disaster response","level":3,"score":0.36559998989105225},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.3628000020980835},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.29589998722076416},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.2793000042438507},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.26420000195503235},{"id":"https://openalex.org/C2776544517","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Unexpected events","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2547999918460846}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc58881.2025.11342598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342598","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7576739192008972,"display_name":"Climate action","id":"https://metadata.un.org/sdg/13"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320337495","display_name":"Technology Development","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W2964220823","https://openalex.org/W3003741573","https://openalex.org/W4319599994","https://openalex.org/W4366392594","https://openalex.org/W4389492857","https://openalex.org/W4390189932","https://openalex.org/W4400258109","https://openalex.org/W4401806048","https://openalex.org/W4402671548","https://openalex.org/W4404739896","https://openalex.org/W4404784276","https://openalex.org/W4405429615","https://openalex.org/W4408696853","https://openalex.org/W4409217930","https://openalex.org/W4409475638","https://openalex.org/W4413145669","https://openalex.org/W4416036279"],"related_works":[],"abstract_inverted_index":{"Unmanned":[0],"Aerial":[1],"Vehicles":[2],"(UAVs)":[3],"are":[4],"increasingly":[5],"important":[6],"in":[7,42,66],"dynamic":[8,67,112],"environments":[9],"such":[10],"as":[11],"logistics":[12],"transportation":[13],"and":[14,29,44,64,75,80],"disaster":[15],"response.":[16],"However,":[17],"current":[18],"tasks":[19],"often":[20],"rely":[21],"on":[22],"human":[23],"operators":[24],"to":[25,59],"monitor":[26],"aerial":[27],"videos":[28],"make":[30],"operational":[31],"decisions.":[32],"This":[33],"mode":[34],"of":[35,94],"human-machine":[36],"collaboration":[37],"suffers":[38],"from":[39],"significant":[40],"limitations":[41],"efficiency":[43],"adaptability.":[45],"In":[46],"this":[47],"paper,":[48],"we":[49],"present":[50],"AirVista-II\u2014an":[51],"end-to-end":[52],"agentic":[53],"system":[54,70,104],"for":[55,86],"embodied":[56],"UAVs,":[57],"designed":[58],"enable":[60],"general-purpose":[61],"semantic":[62,107],"understanding":[63,108],"reasoning":[65],"scenes.":[68],"The":[69],"integrates":[71],"agent-based":[72],"task":[73],"identification":[74],"scheduling,":[76],"multimodal":[77],"perception":[78],"mechanisms,":[79],"differentiated":[81],"keyframe":[82],"extraction":[83],"strategies":[84],"tailored":[85],"various":[87],"temporal":[88],"scenarios,":[89],"enabling":[90],"the":[91,102],"efficient":[92],"capture":[93],"critical":[95],"scene":[96],"information.":[97],"Experimental":[98],"results":[99],"demonstrate":[100],"that":[101],"proposed":[103],"achieves":[105],"high-quality":[106],"across":[109],"diverse":[110],"UAV-based":[111],"scenarios":[113],"under":[114],"a":[115],"zero-shot":[116],"setting.":[117]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-01-29T00:00:00"}
