{"id":"https://openalex.org/W7160502977","doi":"https://doi.org/10.48550/arxiv.2605.04451","title":"RemoteZero: Geospatial Reasoning with Zero Human Annotations","display_name":"RemoteZero: Geospatial Reasoning with Zero Human Annotations","publication_year":2026,"publication_date":"2026-05-06","ids":{"openalex":"https://openalex.org/W7160502977","doi":"https://doi.org/10.48550/arxiv.2605.04451"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.04451","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04451","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.04451","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135587006","display_name":"Liang Yao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yao, Liang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135572055","display_name":"Fan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Fan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135633129","display_name":"Shengxiang Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Shengxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135539686","display_name":"Chuanyi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chuanyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135550012","display_name":"Rui Min","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Min, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135631096","display_name":"Shimin Di","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Di, Shimin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135553105","display_name":"Yuhui Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Yuhui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5135587006"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.29510000348091125,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.29510000348091125,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.2126999944448471,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13282","display_name":"Automated Road and Building Extraction","score":0.13729999959468842,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/geospatial-analysis","display_name":"Geospatial analysis","score":0.8611999750137329},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6686999797821045},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6685000061988831},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5723000168800354},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5525000095367432},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.4717999994754791},{"id":"https://openalex.org/keywords/spatial-intelligence","display_name":"Spatial intelligence","score":0.44839999079704285},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4262999892234802}],"concepts":[{"id":"https://openalex.org/C9770341","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Geospatial analysis","level":2,"score":0.8611999750137329},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.751800000667572},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6686999797821045},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6685000061988831},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5723000168800354},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5525000095367432},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5088000297546387},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.4717999994754791},{"id":"https://openalex.org/C155911833","wikidata":"https://www.wikidata.org/wiki/Q3817354","display_name":"Spatial intelligence","level":2,"score":0.44839999079704285},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4262999892234802},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.3880999982357025},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.38019999861717224},{"id":"https://openalex.org/C143587482","wikidata":"https://www.wikidata.org/wiki/Q1543216","display_name":"Iterative and incremental development","level":2,"score":0.3483000099658966},{"id":"https://openalex.org/C39399123","wikidata":"https://www.wikidata.org/wiki/Q1348989","display_name":"Earth observation","level":3,"score":0.3280999958515167},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3278999924659729},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.3068000078201294},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30079999566078186},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.2741999924182892},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.04451","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04451","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.04451","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04451","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7205292582511902,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Geospatial":[0],"reasoning":[1,24,53,171],"requires":[2],"models":[3,30],"to":[4,31,140],"resolve":[5],"complex":[6],"spatial":[7,59],"semantics":[8],"and":[9,61,123],"user":[10],"intent":[11],"into":[12],"precise":[13,108],"target":[14],"locations":[15],"for":[16,81,169],"Earth":[17],"observation.":[18],"Recent":[19],"progress":[20],"has":[21],"liberated":[22],"the":[23,52,138,164],"path":[25],"from":[26,142],"manual":[27],"curation,":[28],"allowing":[29,137],"generate":[32],"their":[33],"own":[34,149],"inference":[35],"chains.":[36],"Yet":[37],"a":[38,78,88,99,102],"final":[39],"dependency":[40],"remains:":[41],"they":[42],"are":[43],"still":[44],"supervised":[45,161],"by":[46,87],"human-annotated":[47],"ground-truth":[48],"coordinates.":[49,109],"This":[50],"leaves":[51],"process":[54],"autonomous,":[55],"but":[56],"not":[57],"its":[58,148],"endpoint,":[60],"prevents":[62],"true":[63],"self-evolution":[64],"on":[65],"abundant":[66],"unlabeled":[67,143],"remote":[68,144],"sensing":[69,145],"data.":[70],"To":[71],"break":[72],"this":[73,111],"bottleneck,":[74],"we":[75],"introduce":[76],"RemoteZero,":[77],"box-supervision-free":[79],"framework":[80,132],"geospatial":[82,170],"reasoning.":[83],"RemoteZero":[84,115,155],"is":[85,93],"motivated":[86],"simple":[89],"asymmetry:":[90],"an":[91],"MLLM":[92],"typically":[94],"better":[95],"at":[96,105],"verifying":[97],"whether":[98],"region":[100],"satisfies":[101],"query":[103],"than":[104],"directly":[106],"generating":[107],"Leveraging":[110],"stronger":[112],"discriminative":[113],"ability,":[114],"replaces":[116],"geometric":[117],"supervision":[118],"with":[119],"intrinsic":[120],"semantic":[121],"verification":[122,150],"enables":[124],"GRPO":[125],"training":[126,168],"without":[127],"box":[128],"annotations.":[129],"The":[130],"resulting":[131],"further":[133],"supports":[134],"iterative":[135],"self-evolution,":[136],"model":[139],"improve":[141],"imagery":[146],"through":[147],"signal.":[151],"Experiments":[152],"show":[153],"that":[154],"achieves":[156],"competitive":[157],"performance":[158],"against":[159],"strong":[160],"methods,":[162],"demonstrating":[163],"potential":[165],"of":[166],"self-verifying":[167],"localization.":[172]},"counts_by_year":[],"updated_date":"2026-05-08T13:18:25.657630","created_date":"2026-05-08T00:00:00"}
