{"id":"https://openalex.org/W7128633325","doi":"https://doi.org/10.48550/arxiv.2602.09932","title":"GeoFormer: A Lightweight Swin Transformer for Joint Building Height and Footprint Estimation from Sentinel Imagery","display_name":"GeoFormer: A Lightweight Swin Transformer for Joint Building Height and Footprint Estimation from Sentinel Imagery","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7128633325","doi":"https://doi.org/10.48550/arxiv.2602.09932"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.09932","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125625611","display_name":"Han Jinzhen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jinzhen, Han","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125632633","display_name":"JinByeong Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, JinByeong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125671892","display_name":"JiSung Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, JiSung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125632925","display_name":"MinKyung Cho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, MinKyung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125665598","display_name":"DaHee Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, DaHee","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5016480271","display_name":"Hongsik Yun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yun, HongSik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.42399999499320984,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.42399999499320984,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11164","display_name":"Remote Sensing and LiDAR Applications","score":0.2736999988555908,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10801","display_name":"Synthetic Aperture Radar (SAR) Applications and Techniques","score":0.06480000168085098,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/footprint","display_name":"Footprint","score":0.6779999732971191},{"id":"https://openalex.org/keywords/mean-squared-error","display_name":"Mean squared error","score":0.6118999719619751},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.5103999972343445},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.48500001430511475},{"id":"https://openalex.org/keywords/satellite-imagery","display_name":"Satellite imagery","score":0.41510000824928284},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.34209999442100525}],"concepts":[{"id":"https://openalex.org/C132943942","wikidata":"https://www.wikidata.org/wiki/Q2562511","display_name":"Footprint","level":2,"score":0.6779999732971191},{"id":"https://openalex.org/C139945424","wikidata":"https://www.wikidata.org/wiki/Q1940696","display_name":"Mean squared error","level":2,"score":0.6118999719619751},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.5620999932289124},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.5103999972343445},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.48500001430511475},{"id":"https://openalex.org/C2778102629","wikidata":"https://www.wikidata.org/wiki/Q725252","display_name":"Satellite imagery","level":2,"score":0.41510000824928284},{"id":"https://openalex.org/C39432304","wikidata":"https://www.wikidata.org/wiki/Q188847","display_name":"Environmental science","level":0,"score":0.4025000035762787},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.40209999680519104},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.34209999442100525},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.31290000677108765},{"id":"https://openalex.org/C108597893","wikidata":"https://www.wikidata.org/wiki/Q663650","display_name":"Reflectivity","level":2,"score":0.2858999967575073},{"id":"https://openalex.org/C127040729","wikidata":"https://www.wikidata.org/wiki/Q174844","display_name":"Megacity","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C132651083","wikidata":"https://www.wikidata.org/wiki/Q7942","display_name":"Climate change","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C35651441","wikidata":"https://www.wikidata.org/wiki/Q625303","display_name":"Independence (probability theory)","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C51399673","wikidata":"https://www.wikidata.org/wiki/Q504027","display_name":"Lidar","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.09932","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.09932","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09932","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.09932","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","score":0.7351348996162415,"display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Building":[0],"height":[1,165],"(BH)":[2],"and":[3,17,43,57,70,88,96,147,167,191],"footprint":[4],"(BF)":[5],"are":[6,196],"fundamental":[7],"urban":[8],"morphological":[9],"parameters":[10,114],"required":[11],"by":[12,122],"climate":[13],"modelling,":[14],"disaster-risk":[15],"assessment,":[16],"population":[18],"mapping,":[19],"yet":[20],"globally":[21],"consistent":[22],"data":[23],"remain":[24],"scarce.":[25],"In":[26],"this":[27],"work,":[28],"we":[29],"develop":[30],"GeoFormer,":[31],"a":[32,46,104,153],"lightweight":[33],"Swin":[34],"Transformer-based":[35],"multi-task":[36],"learning":[37],"framework":[38],"that":[39,101,126,152],"jointly":[40],"estimates":[41],"BH":[42,105,179],"BF":[44],"on":[45,141],"100":[47],"m":[48,109,183],"grid":[49],"using":[50],"only":[51,111],"open-access":[52],"Sentinel-1":[53],"SAR,":[54],"Sentinel-2":[55],"multispectral,":[56],"DEM":[58,161],"data.":[59],"A":[60],"geo-blocked":[61],"data-splitting":[62],"strategy":[63],"enforces":[64],"strict":[65],"spatial":[66,97],"independence":[67],"between":[68],"training":[69],"evaluation":[71],"regions":[72],"across":[73],"54":[74],"morphologically":[75],"diverse":[76],"cities.":[77],"We":[78],"set":[79],"representative":[80],"CNN":[81,119],"baselines":[82],"(ResNet,":[83],"UNet,":[84],"SENet)":[85],"as":[86],"benchmarks":[87],"thoroughly":[89],"evaluate":[90],"GeoFormer's":[91],"prediction":[92],"accuracy,":[93],"computational":[94],"efficiency,":[95],"transferability.":[98],"Results":[99],"show":[100],"GeoFormer":[102],"achieves":[103],"RMSE":[106,180],"of":[107],"3.19":[108],"with":[110],"0.32":[112],"M":[113],"--":[115,124],"outperforming":[116],"the":[117,171,192],"best":[118],"baseline":[120],"(UNet)":[121],"7.5%":[123],"indicating":[125],"windowed":[127],"local":[128],"attention":[129],"is":[130,159,162],"more":[131],"effective":[132],"than":[133],"convolution":[134],"for":[135,164],"scene-level":[136],"building-parameter":[137],"retrieval.":[138],"Systematic":[139],"ablation":[140],"context":[142],"window":[143],"size,":[144],"model":[145,189],"capacity,":[146],"input":[148],"modality":[149],"further":[150],"reveals":[151],"5x5":[154],"(500":[155],"m)":[156],"receptive":[157],"field":[158],"optimal,":[160],"indispensable":[163],"estimation,":[166],"multispectral":[168],"reflectance":[169],"carries":[170],"dominant":[172],"predictive":[173],"signal.":[174],"Cross-continent":[175],"transfer":[176],"tests":[177],"confirm":[178],"below":[181],"3.5":[182],"without":[184],"region-specific":[185],"fine-tuning.":[186],"All":[187],"code,":[188],"weights,":[190],"resulting":[193],"global":[194],"product":[195],"publicly":[197],"released.":[198]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-12T00:00:00"}
