{"id":"https://openalex.org/W4417289896","doi":"https://doi.org/10.48550/arxiv.2512.09251","title":"GLACIA: Instance-Aware Positional Reasoning for Glacial Lake Segmentation via Multimodal Large Language Model","display_name":"GLACIA: Instance-Aware Positional Reasoning for Glacial Lake Segmentation via Multimodal Large Language Model","publication_year":2025,"publication_date":"2025-12-10","ids":{"openalex":"https://openalex.org/W4417289896","doi":"https://doi.org/10.48550/arxiv.2512.09251"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2512.09251","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.09251","pdf_url":"https://arxiv.org/pdf/2512.09251","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2512.09251","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050693808","display_name":"Lalit Maurya","orcid":"https://orcid.org/0000-0003-2234-8692"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Maurya, Lalit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082426214","display_name":"Saurabh Kaushik","orcid":"https://orcid.org/0000-0002-2791-3729"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kaushik, Saurabh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5087383776","display_name":"Beth Tellman","orcid":"https://orcid.org/0000-0003-3026-6435"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tellman, Beth","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5050693808"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.23149999976158142,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.23149999976158142,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.15850000083446503,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10644","display_name":"Cryospheric studies and observations","score":0.1216999962925911,"subfield":{"id":"https://openalex.org/subfields/1902","display_name":"Atmospheric Science"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6780999898910522},{"id":"https://openalex.org/keywords/glacial-period","display_name":"Glacial period","score":0.4442000091075897},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.41370001435279846},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.40369999408721924},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.392300009727478},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.36640000343322754},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.36250001192092896},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.3488999903202057}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.732200026512146},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6780999898910522},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5981000065803528},{"id":"https://openalex.org/C15739521","wikidata":"https://www.wikidata.org/wiki/Q602963","display_name":"Glacial period","level":2,"score":0.4442000091075897},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.41370001435279846},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.40369999408721924},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.392300009727478},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.36640000343322754},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3488999903202057},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.32100000977516174},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3052000105381012},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.3005000054836273},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.28220000863075256},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.2791999876499176},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2743000090122223},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.27059999108314514},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.26919999718666077},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2524000108242035}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2512.09251","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.09251","pdf_url":"https://arxiv.org/pdf/2512.09251","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2512.09251","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.09251","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2512.09251","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.09251","pdf_url":"https://arxiv.org/pdf/2512.09251","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Glacial":[0,12,81],"lake":[1],"monitoring":[2],"bears":[3],"great":[4],"significance":[5],"in":[6,105,154],"mitigating":[7],"the":[8,56,80,98,155],"anticipated":[9],"risk":[10],"of":[11,100,157],"Lake":[13,82],"Outburst":[14],"Floods.":[15],"However,":[16],"existing":[17],"segmentation":[18,51,65,71,139],"methods":[19,140],"based":[20,118,138],"on":[21,119,178],"convolutional":[22],"neural":[23],"networks":[24],"(CNNs)":[25],"and":[26,40,73,136,151,171],"Vision":[27],"Transformers":[28],"(ViTs),":[29],"remain":[30],"constrained":[31],"to":[32,67,96],"pixel-level":[33],"predictions,":[34],"lacking":[35],"high-level":[36],"global":[37],"scene":[38],"semantics":[39],"human-interpretable":[41],"reasoning.":[42],"To":[43],"address":[44],"this,":[45],"we":[46],"introduce":[47],"GLACIA":[48,112],"(\\textbf{G}lacial":[49],"\\textbf{LA}ke":[50],"with":[52,64],"\\textbf{C}ontextual":[53],"\\textbf{I}nstance":[54],"\\textbf{A}wareness),":[55],"first":[57],"framework":[58],"that":[59,111],"integrates":[60],"large":[61],"language":[62,165],"models":[63,131],"capabilities":[66],"produce":[68],"both":[69],"accurate":[70],"masks":[72],"corresponding":[74],"spatial":[75],"reasoning":[76,103,137],"outputs.":[77],"We":[78],"construct":[79],"Position":[83],"Reasoning":[84],"(GLake-Pos)":[85],"dataset":[86],"pipeline,":[87],"which":[88],"provides":[89],"diverse,":[90],"spatially":[91],"grounded":[92],"question-answer":[93],"pairs":[94],"designed":[95],"overcome":[97],"lack":[99],"instance-aware":[101],"positional":[102],"data":[104],"remote":[106],"sensing.":[107],"Comparative":[108],"evaluation":[109],"demonstrate":[110],"(mIoU:":[113,121,126,132,141],"87.30)":[114],"surpasses":[115],"state-of-the-art":[116],"method":[117],"CNNs":[120],"78.55":[122],"-":[123,128,134,143],"79.01),":[124],"ViTs":[125],"69.27":[127],"81.75),":[129],"Geo-foundation":[130],"76.37":[133],"87.10),":[135],"60.12":[142],"75.66).":[144],"Our":[145],"approach":[146],"enables":[147],"intuitive":[148],"disaster":[149],"preparedness":[150],"informed":[152],"policy-making":[153],"context":[156],"rapidly":[158],"changing":[159],"glacial":[160],"environments":[161],"by":[162],"facilitating":[163],"natural":[164],"interaction,":[166],"thereby":[167],"supporting":[168],"more":[169],"efficient":[170],"interpretable":[172],"decision-making.":[173],"The":[174],"code":[175],"is":[176],"released":[177],"https://github.com/lalitmaurya47/GLACIA":[179]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-12-12T00:00:00"}
