{"id":"https://openalex.org/W7124932506","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331451","title":"All Seeing Eyes: A Native-Resolution Vision-Language Framework for High-Fidelity Remote Sensing Image Understanding","display_name":"All Seeing Eyes: A Native-Resolution Vision-Language Framework for High-Fidelity Remote Sensing Image Understanding","publication_year":2025,"publication_date":"2025-11-14","ids":{"openalex":"https://openalex.org/W7124932506","doi":"https://doi.org/10.1109/cloudcom67567.2025.11331451"},"language":null,"primary_location":{"id":"doi:10.1109/cloudcom67567.2025.11331451","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331451","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075392699","display_name":"Jingrui Zhang","orcid":"https://orcid.org/0000-0001-7732-8459"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingrui Zhang","raw_affiliation_strings":["Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115590655","display_name":"Zhang Ye","orcid":"https://orcid.org/0000-0003-3495-5596"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Zhang","raw_affiliation_strings":["Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123415793","display_name":"Yimeng Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yimeng Xu","raw_affiliation_strings":["Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123375025","display_name":"Zixuan Shangguan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zixuan Shangguan","raw_affiliation_strings":["Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123379970","display_name":"Lijie Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134503","display_name":"Petroleum Technology Company (Norway)","ror":"https://ror.org/03d9q1m75","country_code":"NO","type":"company","lineage":["https://openalex.org/I4210134503"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"Lijie Zhang","raw_affiliation_strings":["Shandong Kerui Petroleum &#x0026; Gas Equipment Co., Ltd.,Dongying,China"],"affiliations":[{"raw_affiliation_string":"Shandong Kerui Petroleum &#x0026; Gas Equipment Co., Ltd.,Dongying,China","institution_ids":["https://openalex.org/I4210134503"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123448635","display_name":"Lihao Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210088761","display_name":"International Marine and Dredging Consultants","ror":"https://ror.org/00b7zp807","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210088761"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Lihao Yang","raw_affiliation_strings":["CCCC. Tianjin Dredging Co., Ltd.,Tianjin,China"],"affiliations":[{"raw_affiliation_string":"CCCC. Tianjin Dredging Co., Ltd.,Tianjin,China","institution_ids":["https://openalex.org/I4210088761"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123440940","display_name":"Yang Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I4210109870","display_name":"Vi Technology (United States)","ror":"https://ror.org/016mnbp44","country_code":"US","type":"company","lineage":["https://openalex.org/I4210109870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yang Zhou","raw_affiliation_strings":["Nova Stella (Shenzhen) Technology Co., Ltd.,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Nova Stella (Shenzhen) Technology Co., Ltd.,Shenzhen,China","institution_ids":["https://openalex.org/I4210109870"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102758440","display_name":"Xiaoyi Fan","orcid":"https://orcid.org/0000-0001-5135-9855"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyi Fan","raw_affiliation_strings":["Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123405278","display_name":"Feng Liang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Liang","raw_affiliation_strings":["Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Shenzhen MSU-BIT University,Guangdong-Hong Kong-Macao Joint Laboratory for Emotional Intelligence and Pervasive Computing,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5075392699"],"corresponding_institution_ids":["https://openalex.org/I4210152380"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.67221539,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.4074000120162964,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.4074000120162964,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.1738000065088272,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.09830000251531601,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6216999888420105},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.4262999892234802},{"id":"https://openalex.org/keywords/image-resolution","display_name":"Image resolution","score":0.4058000147342682},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.3684999942779541},{"id":"https://openalex.org/keywords/remote-sensing-application","display_name":"Remote sensing application","score":0.35580000281333923},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.353300005197525}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7287999987602234},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.6829000115394592},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6216999888420105},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44909998774528503},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.4262999892234802},{"id":"https://openalex.org/C205372480","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"Image resolution","level":2,"score":0.4058000147342682},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39259999990463257},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3684999942779541},{"id":"https://openalex.org/C183365957","wikidata":"https://www.wikidata.org/wiki/Q17140402","display_name":"Remote sensing application","level":3,"score":0.35580000281333923},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.353300005197525},{"id":"https://openalex.org/C3020199158","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"High resolution","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3456999957561493},{"id":"https://openalex.org/C2778102629","wikidata":"https://www.wikidata.org/wiki/Q725252","display_name":"Satellite imagery","level":2,"score":0.2904999852180481},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.2858000099658966},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.27489998936653137}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cloudcom67567.2025.11331451","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cloudcom67567.2025.11331451","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 lEEE International Conference on Cloud Computing Technology and Science (CloudCom)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8465124245","display_name":null,"funder_award_id":"62576213","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1980038761","https://openalex.org/W2510520237","https://openalex.org/W2515866431","https://openalex.org/W2779054585","https://openalex.org/W2962749812","https://openalex.org/W3003741573","https://openalex.org/W3035104321","https://openalex.org/W3128592650","https://openalex.org/W3151130473","https://openalex.org/W4206706211","https://openalex.org/W4214614183","https://openalex.org/W4292968451","https://openalex.org/W4312769131","https://openalex.org/W4321497943","https://openalex.org/W4322707256","https://openalex.org/W4386071599","https://openalex.org/W4386075535","https://openalex.org/W4394938913","https://openalex.org/W4405806139","https://openalex.org/W4407152340","https://openalex.org/W4409383105"],"related_works":[],"abstract_inverted_index":{"The":[0],"success":[1],"of":[2,73,88,100,113,192],"Vision":[3],"Transformers":[4],"(ViTs)":[5],"has":[6],"profoundly":[7],"reshaped":[8],"research":[9],"paradigms":[10],"in":[11,63,80,96,136,225],"computer":[12],"vision.":[13],"However,":[14],"similar":[15],"to":[16,25,28,45,188],"conventional":[17],"CNN-based":[18],"models,":[19],"ViTs":[20,127],"still":[21],"require":[22],"input":[23],"images":[24,37,194],"be":[26],"resized":[27],"fixed":[29],"resolution.":[30],"Mainstream":[31],"open-source":[32,126],"ViT":[33,185],"implementations":[34],"typically":[35],"resize":[36],"into":[38],"a":[39,77,92,104,111,152],"square":[40],"shape,":[41],"which":[42],"inevitably":[43],"leads":[44],"information":[46,140],"loss":[47],"and":[48,51,159],"increases":[49],"computational":[50],"memory":[52],"overhead.":[53],"Moreover,":[54],"prior":[55],"studies":[56],"have":[57],"highlighted":[58],"that":[59,155,164,204],"the":[60,70,86,97,121,178,183,190],"visual":[61,74],"encoder":[62,154],"multimodal":[64],"large":[65],"language":[66],"models":[67],"(MLLMs),":[68],"as":[69],"primary":[71],"source":[72],"information,":[75],"plays":[76],"crucial":[78],"role":[79],"determining":[81],"overall":[82],"model":[83],"understanding.":[84,173],"In":[85,174],"field":[87],"satellite":[89],"remote":[90,106,143,170,208],"sensing,":[91],"distinctive":[93],"challenge":[94],"lies":[95],"ultra-high":[98],"resolution":[99,112,123,198],"imagery.":[101],"For":[102],"instance,":[103],"2K":[105],"sensing":[107,144,171,209],"image":[108,172,212],"may":[109],"reach":[110],"<tex":[114,129],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[115,130],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$2560":[116],"\\times":[117],"1440$</tex>,":[118],"far":[119],"exceeding":[120],"maximum":[122],"supported":[124],"by":[125],"(e.g.,":[128],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$336\\times":[131],"336$</tex>).":[132],"This":[133],"limitation":[134],"results":[135,202],"even":[137],"more":[138],"severe":[139],"degradation":[141],"for":[142,169],"scenarios.":[145,227],"To":[146],"address":[147],"this,":[148],"Google":[149],"proposed":[150],"NaViT,":[151],"vision":[153],"supports":[156],"native":[157,197],"resolutions":[158],"aspect":[160],"ratios.":[161],"We":[162],"argue":[163],"NaViT":[165,187],"is":[166],"particularly":[167],"valuable":[168],"this":[175],"work,":[176],"following":[177],"LLaVA":[179],"paradigm,":[180],"we":[181],"replace":[182],"standard":[184],"with":[186],"investigate":[189],"benefits":[191],"processing":[193],"at":[195],"their":[196],"within":[199],"MLLMs.":[200],"Experimental":[201],"demonstrate":[203],"across":[205,218],"several":[206],"main-stream":[207],"benchmarks,":[210],"native-resolution":[211],"understanding":[213],"consistently":[214],"delivers":[215],"notable":[216],"improvements":[217],"multiple":[219],"evaluation":[220],"metrics,":[221],"validating":[222],"its":[223],"effectiveness":[224],"high-resolution":[226]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-01-21T00:00:00"}
