{"id":"https://openalex.org/W4417251974","doi":"https://doi.org/10.1109/lra.2025.3643290","title":"GRAD-NAV++: Vision-Language Model Enabled Visual Drone <u>Nav</u> igation With <u>G</u> aussian <u>Ra</u> diance Fields and <u>D</u> ifferentiable Dynamics","display_name":"GRAD-NAV++: Vision-Language Model Enabled Visual Drone <u>Nav</u> igation With <u>G</u> aussian <u>Ra</u> diance Fields and <u>D</u> ifferentiable Dynamics","publication_year":2025,"publication_date":"2025-12-11","ids":{"openalex":"https://openalex.org/W4417251974","doi":"https://doi.org/10.1109/lra.2025.3643290"},"language":null,"primary_location":{"id":"doi:10.1109/lra.2025.3643290","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3643290","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033153152","display_name":"Qianzhong Chen","orcid":"https://orcid.org/0009-0001-5318-7580"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qianzhong Chen","raw_affiliation_strings":["Department of Mechanical Engineering, Stanford University, Stanford, CA, USA"],"raw_orcid":"https://orcid.org/0009-0001-5318-7580","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090403455","display_name":"Naixiang Gao","orcid":"https://orcid.org/0000-0003-3208-5849"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Naixiang Gao","raw_affiliation_strings":["Department of Mechanical Engineering, Stanford University, Stanford, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-3208-5849","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114122061","display_name":"Suning Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Suning Huang","raw_affiliation_strings":["Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112189451","display_name":"JunEn Low","orcid":"https://orcid.org/0000-0002-1011-1404"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"JunEn Low","raw_affiliation_strings":["Department of Mechanical Engineering, Stanford University, Stanford, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-1011-1404","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076466206","display_name":"T. Chen","orcid":"https://orcid.org/0000-0003-3948-8739"},"institutions":[{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Timothy Chen","raw_affiliation_strings":["Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-3948-8739","affiliations":[{"raw_affiliation_string":"Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101424688","display_name":"Jiankai Sun","orcid":"https://orcid.org/0000-0001-5633-1739"},"institutions":[{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiankai Sun","raw_affiliation_strings":["Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA"],"raw_orcid":"https://orcid.org/0000-0001-5633-1739","affiliations":[{"raw_affiliation_string":"Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081950488","display_name":"Mac Schwager","orcid":"https://orcid.org/0000-0002-7871-3663"},"institutions":[{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mac Schwager","raw_affiliation_strings":["Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-7871-3663","affiliations":[{"raw_affiliation_string":"Department of Aeronautics and Astronautics, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.35540878,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11","issue":"2","first_page":"1418","last_page":"1425"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9444000124931335,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9444000124931335,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.012000000104308128,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.005799999926239252,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6811000108718872},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.6499000191688538},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5388000011444092},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4964999854564667},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.4839000105857849},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.41280001401901245},{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.400299996137619},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.374099999666214}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8238000273704529},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6811000108718872},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.6499000191688538},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6233000159263611},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5388000011444092},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4964999854564667},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.4839000105857849},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.41280001401901245},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.400299996137619},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.374099999666214},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35339999198913574},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33970001339912415},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.3278000056743622},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2948000133037567},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.273499995470047},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.26100000739097595},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.25920000672340393},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2540000081062317},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2025.3643290","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3643290","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6951003262","display_name":null,"funder_award_id":"N00014-23-1-2354","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320315934","display_name":"Toyota Research Institute","ror":null},{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2025653905","https://openalex.org/W2150884987","https://openalex.org/W2951360122","https://openalex.org/W3029808435","https://openalex.org/W4383108274","https://openalex.org/W4385318467","https://openalex.org/W4390873312","https://openalex.org/W4396910019","https://openalex.org/W4407948422","https://openalex.org/W4408709139","https://openalex.org/W4409368288","https://openalex.org/W4409473885","https://openalex.org/W4410771465","https://openalex.org/W4414079054","https://openalex.org/W4416748468"],"related_works":[],"abstract_inverted_index":{"Autonomous":[0],"drones":[1],"capable":[2],"of":[3,77,114,154],"interpreting":[4],"and":[5,50,82,119,138,160,178],"executing":[6],"high-level":[7],"language":[8],"instructions":[9],"in":[10,54,61,124],"unstructured":[11],"environments":[12,159],"remain":[13],"a":[14,41,62,89,111,169],"long-standing":[15],"goal.":[16],"Yet":[17],"existing":[18],"approaches":[19],"are":[20],"constrained":[21],"by":[22],"their":[23],"dependence":[24],"on":[25,116,121,128,135,140,191],"hand-crafted":[26],"skills,":[27],"extensive":[28],"parameter":[29],"tuning,":[30],"or":[31],"computationally":[32],"intensive":[33],"models":[34,183],"unsuitable":[35],"for":[36,172],"onboard":[37,49,174],"use.":[38],"We":[39],"introduce":[40],"lightweight":[42],"Vision\u2013Language\u2013Action":[43],"(VLA)":[44,176],"framework":[45],"that":[46,180],"runs":[47],"fully":[48,173],"follows":[51],"natural-language":[52],"commands":[53],"real":[55,129],"time.":[56],"Our":[57],"policy":[58],"is":[59,88],"trained":[60,117,136],"photorealistic":[63],"3D":[64],"Gaussian":[65],"Splatting":[66],"(3DGS)":[67],"simulator":[68],"via":[69],"Differentiable":[70],"Reinforcement":[71],"Learning":[72],"(DiffRL),":[73],"enabling":[74],"efficient":[75,182],"learning":[76],"low-level":[78],"control":[79],"from":[80],"visual":[81],"linguistic":[83],"inputs.":[84],"At":[85],"its":[86],"core":[87],"Mixture-of-Experts":[90],"(MoE)":[91],"action":[92],"head,":[93],"which":[94],"adaptively":[95],"routes":[96],"computation":[97],"to":[98],"improve":[99],"generalization":[100,106],"while":[101],"mitigating":[102],"forgetting.":[103],"In":[104,143],"multi-task":[105],"experiments,":[107,146],"our":[108,147],"method":[109,148],"achieves":[110,149],"success":[112,134,152],"rate":[113,153],"83%":[115],"tasks":[118,123,137],"75%":[120],"unseen":[122,141],"simulation.":[125],"When":[126],"deployed":[127],"hardware,":[130],"it":[131],"attains":[132],"67%":[133,161],"50%":[139],"ones.":[142],"multi-environment":[144],"adaptation":[145],"an":[150],"average":[151],"81%":[155],"across":[156,162],"diverse":[157],"simulated":[158],"varied":[163],"real-world":[164],"settings.":[165],"These":[166],"results":[167],"establish":[168],"new":[170],"benchmark":[171],"Vision-Language-Action":[175],"flight":[177],"demonstrate":[179],"compact,":[181],"can":[184],"enable":[185],"reliable,":[186],"language-guided":[187],"navigation":[188],"without":[189],"relying":[190],"external":[192],"infrastructure.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-12-11T00:00:00"}
