{"id":"https://openalex.org/W7158502547","doi":"https://doi.org/10.48550/arxiv.2604.26221","title":"Seeking Consensus: Geometric-Semantic On-the-Fly Recalibration for Open-Vocabulary Remote Sensing Semantic Segmentation","display_name":"Seeking Consensus: Geometric-Semantic On-the-Fly Recalibration for Open-Vocabulary Remote Sensing Semantic Segmentation","publication_year":2026,"publication_date":"2026-04-29","ids":{"openalex":"https://openalex.org/W7158502547","doi":"https://doi.org/10.48550/arxiv.2604.26221"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.26221","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26221","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.26221","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069808220","display_name":"Guanchun Wang","orcid":"https://orcid.org/0000-0002-9606-7052"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Guanchun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134902616","display_name":"Chenxiao Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Chenxiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134909944","display_name":"Xiangrong Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiangrong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016326528","display_name":"Zelin Peng","orcid":"https://orcid.org/0009-0002-4066-7929"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Zelin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127227703","display_name":"Jianxun Lai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lai, Jianxun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134908876","display_name":"Tianyang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Tianyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134899715","display_name":"Xu Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Xu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5069808220"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.8557999730110168,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.8557999730110168,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.0272000003606081,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.026900000870227814,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5931000113487244},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.5839999914169312},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5716999769210815},{"id":"https://openalex.org/keywords/land-cover","display_name":"Land cover","score":0.4999000132083893},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.49410000443458557},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3912000060081482},{"id":"https://openalex.org/keywords/semantic-heterogeneity","display_name":"Semantic heterogeneity","score":0.2980000078678131}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7350999712944031},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5931000113487244},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.5839999914169312},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5716999769210815},{"id":"https://openalex.org/C2780648208","wikidata":"https://www.wikidata.org/wiki/Q3001793","display_name":"Land cover","level":3,"score":0.4999000132083893},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.49410000443458557},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.48559999465942383},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44690001010894775},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3912000060081482},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3070000112056732},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3025999963283539},{"id":"https://openalex.org/C2778180026","wikidata":"https://www.wikidata.org/wiki/Q18378163","display_name":"Semantic heterogeneity","level":4,"score":0.2980000078678131},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2946999967098236},{"id":"https://openalex.org/C183365957","wikidata":"https://www.wikidata.org/wiki/Q17140402","display_name":"Remote sensing application","level":3,"score":0.2872999906539917},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2793000042438507},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.273499995470047},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.2712000012397766},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.251800000667572},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.26221","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26221","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.26221","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26221","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6123055219650269,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Open-vocabulary":[0],"semantic":[1,42,95,129],"segmentation":[2],"(OVSS)":[3],"in":[4,41,44,72],"remote":[5,73,151],"sensing":[6,74,152],"images":[7],"is":[8],"a":[9,29,61],"promising":[10],"task":[11],"that":[12],"employs":[13],"textual":[14,100,111],"descriptions":[15],"for":[16,141],"identifying":[17],"undefined":[18],"land":[19,46],"cover":[20],"categories.":[21],"Despite":[22],"notable":[23],"advances,":[24],"existing":[25],"methods":[26],"typically":[27],"employ":[28],"static":[30],"inference":[31],"paradigm,":[32],"overlooking":[33],"the":[34,66,126],"distinct":[35],"distribution":[36],"of":[37,68,108],"each":[38,142],"scene,":[39],"resulting":[40],"ambiguity":[43],"diverse":[45],"covers":[47],"and":[48,94,110,128,161],"incomplete":[49],"foreground":[50],"activation.":[51],"Motivated":[52],"by":[53,82],"this,":[54],"we":[55],"propose":[56],"Seeking":[57],"Consensus,":[58],"termed":[59],"SeeCo,":[60],"plug-and-play":[62],"framework":[63],"to":[64],"boost":[65],"performance":[67],"training-free":[69],"OVSS":[70,79,153],"models":[71,80],"images,":[75],"which":[76,104],"recalibrates":[77,138],"arbitrary":[78],"on-the-fly":[81],"seeking":[83],"dual":[84],"consensus:":[85],"geometric":[86],"consensus":[87,96,115,121],"learning":[88,97],"(GCL)":[89],"through":[90],"multi-view":[91],"consistent":[92,156],"observations":[93],"(SCL)":[98],"via":[99,118],"description":[101],"adaptive":[102],"calibration,":[103],"assists":[105],"collaborative":[106],"recalibration":[107],"visual":[109],"semantics.":[112],"The":[113],"two":[114],"are":[116],"injected":[117],"an":[119],"online":[120],"injector":[122],"(OCI),":[123],"effectively":[124],"alleviating":[125],"under-activation":[127],"bias.":[130],"SeeCo":[131],"requires":[132],"no":[133],"specific":[134],"training":[135],"process,":[136],"yet":[137],"semantic-geometric":[139],"alignment":[140],"unique":[143],"scene":[144],"during":[145],"inference.":[146],"Extensive":[147],"experiments":[148],"on":[149],"eight":[150],"benchmarks":[154],"show":[155],"gains,":[157],"proving":[158],"its":[159],"effectiveness":[160],"universality.":[162]},"counts_by_year":[],"updated_date":"2026-05-01T06:10:29.291645","created_date":"2026-05-01T00:00:00"}
