{"id":"https://openalex.org/W7155399835","doi":"https://doi.org/10.48550/arxiv.2604.20190","title":"WildFireVQA: A Large-Scale Radiometric Thermal VQA Benchmark for Aerial Wildfire Monitoring","display_name":"WildFireVQA: A Large-Scale Radiometric Thermal VQA Benchmark for Aerial Wildfire Monitoring","publication_year":2026,"publication_date":"2026-04-22","ids":{"openalex":"https://openalex.org/W7155399835","doi":"https://doi.org/10.48550/arxiv.2604.20190"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.20190","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20190","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.20190","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134402510","display_name":"Mobin Habibpour","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Habibpour, Mobin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031144137","display_name":"Niloufar Alipour Talemi","orcid":"https://orcid.org/0009-0000-6881-3671"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Talemi, Niloufar Alipour","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134432887","display_name":"John Spodnik","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Spodnik, John","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134406380","display_name":"Camren J. Khoury","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khoury, Camren J.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134438980","display_name":"Fatemeh Afghah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Afghah, Fatemeh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7199000120162964,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7199000120162964,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12597","display_name":"Fire Detection and Safety Systems","score":0.0982000008225441,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.05590000003576279,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6852999925613403},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.633400022983551},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.43630000948905945},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.4226999878883362},{"id":"https://openalex.org/keywords/aerial-image","display_name":"Aerial image","score":0.4212999939918518},{"id":"https://openalex.org/keywords/aerial-survey","display_name":"Aerial survey","score":0.4156999886035919},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.38760000467300415},{"id":"https://openalex.org/keywords/aerial-photography","display_name":"Aerial photography","score":0.3691999912261963}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6852999925613403},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.633400022983551},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.5727999806404114},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5625},{"id":"https://openalex.org/C39432304","wikidata":"https://www.wikidata.org/wiki/Q188847","display_name":"Environmental science","level":0,"score":0.4377000033855438},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.43630000948905945},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.4226999878883362},{"id":"https://openalex.org/C2776429412","wikidata":"https://www.wikidata.org/wiki/Q4688011","display_name":"Aerial image","level":3,"score":0.4212999939918518},{"id":"https://openalex.org/C176262533","wikidata":"https://www.wikidata.org/wiki/Q4688034","display_name":"Aerial survey","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39800000190734863},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.38760000467300415},{"id":"https://openalex.org/C133214962","wikidata":"https://www.wikidata.org/wiki/Q191839","display_name":"Aerial photography","level":2,"score":0.3691999912261963},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.35280001163482666},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.32820001244544983},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.3273000121116638},{"id":"https://openalex.org/C170187044","wikidata":"https://www.wikidata.org/wiki/Q214753","display_name":"Radiometric dating","level":2,"score":0.32359999418258667},{"id":"https://openalex.org/C145804949","wikidata":"https://www.wikidata.org/wiki/Q478123","display_name":"Situation awareness","level":2,"score":0.31769999861717224},{"id":"https://openalex.org/C2778522173","wikidata":"https://www.wikidata.org/wiki/Q7281293","display_name":"Radiometric calibration","level":3,"score":0.3070000112056732},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2888999879360199},{"id":"https://openalex.org/C39399123","wikidata":"https://www.wikidata.org/wiki/Q1348989","display_name":"Earth observation","level":3,"score":0.28859999775886536},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2867000102996826},{"id":"https://openalex.org/C87456703","wikidata":"https://www.wikidata.org/wiki/Q247760","display_name":"Radiometry","level":2,"score":0.28610000014305115},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.26759999990463257},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.26489999890327454},{"id":"https://openalex.org/C204530211","wikidata":"https://www.wikidata.org/wiki/Q752823","display_name":"Thermal","level":2,"score":0.25760000944137573},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.20190","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20190","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.20190","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20190","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Wildfire":[0],"monitoring":[1,38],"requires":[2],"timely,":[3],"actionable":[4],"situational":[5],"awareness":[6],"from":[7],"airborne":[8],"platforms,":[9],"yet":[10],"existing":[11,180],"aerial":[12,36],"visual":[13],"question":[14],"answering":[15],"(VQA)":[16],"benchmarks":[17],"do":[18],"not":[19],"evaluate":[20],"wildfire-specific":[21],"multimodal":[22,107],"reasoning":[23,175],"grounded":[24],"in":[25,182],"thermal":[26,45,61,66,144,162],"measurements.":[27],"We":[28,126],"introduce":[29],"WildFireVQA,":[30],"a":[31,59,64,75,129],"large-scale":[32],"VQA":[33],"benchmark":[34,189],"for":[35,97,133,157,166],"wildfire":[37,99,184],"that":[39,148],"integrates":[40],"RGB":[41,57,152],"imagery":[42],"with":[43,71,114],"radiometric":[44,65,143],"data.":[46],"WildFireVQA":[47],"contains":[48],"6,097":[49],"RGB-thermal":[50],"samples,":[51],"where":[52],"each":[53],"sample":[54],"includes":[55],"an":[56],"image,":[58],"color-mapped":[60],"visualization,":[62],"and":[63,68,83,87,90,94,120,122,139,176,188],"TIFF,":[67],"is":[69],"paired":[70],"34":[72],"questions,":[73],"yielding":[74],"total":[76],"of":[77,173,179],"207,298":[78],"multiple-choice":[79],"questions":[80],"spanning":[81],"presence":[82],"detection,":[84],"classification,":[85],"distribution":[86],"segmentation,":[88],"localization":[89],"direction,":[91],"cross-modal":[92],"reasoning,":[93],"flight":[95],"planning":[96],"operational":[98],"intelligence.":[100],"To":[101],"improve":[102],"annotation":[103],"reliability,":[104],"we":[105],"combine":[106],"large":[108],"language":[109],"model":[110],"(MLLM)-based":[111],"answer":[112],"generation":[113],"sensor-driven":[115],"deterministic":[116],"labeling,":[117],"manual":[118],"verification,":[119],"intra-frame":[121],"inter-frame":[123],"consistency":[124],"checks.":[125],"further":[127],"establish":[128],"comprehensive":[130],"evaluation":[131],"protocol":[132],"representative":[134],"MLLMs":[135,181],"under":[136],"RGB,":[137],"Thermal,":[138],"retrieval-augmented":[140],"settings":[141],"using":[142],"statistics.":[145],"Experiments":[146],"show":[147],"across":[149],"task":[150],"categories,":[151],"remains":[153],"the":[154,171,177],"strongest":[155],"modality":[156],"current":[158],"models,":[159],"while":[160],"retrieved":[161],"context":[163],"yields":[164],"gains":[165],"stronger":[167],"MLLMs,":[168],"highlighting":[169],"both":[170],"value":[172],"temperature-grounded":[174],"limitations":[178],"safety-critical":[183],"scenarios.":[185],"The":[186],"dataset":[187],"code":[190],"are":[191],"open-source":[192],"at":[193],"https://github.com/mobiiin/WildFire_VQA.":[194]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-24T00:00:00"}
