{"id":"https://openalex.org/W4417129277","doi":"https://doi.org/10.48550/arxiv.2510.09343","title":"Enhancing Infrared Vision: Progressive Prompt Fusion Network and Benchmark","display_name":"Enhancing Infrared Vision: Progressive Prompt Fusion Network and Benchmark","publication_year":2025,"publication_date":"2025-10-10","ids":{"openalex":"https://openalex.org/W4417129277","doi":"https://doi.org/10.48550/arxiv.2510.09343"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2510.09343","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.09343","pdf_url":"https://arxiv.org/pdf/2510.09343","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2510.09343","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100675904","display_name":"Jinyuan Liu","orcid":"https://orcid.org/0000-0003-2085-2676"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Liu, Jinyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046711799","display_name":"Zihang Chen","orcid":"https://orcid.org/0000-0002-7437-7850"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zihang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100380632","display_name":"Zhu Liu","orcid":"https://orcid.org/0000-0003-0975-2711"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zhu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016996735","display_name":"Zhiying Jiang","orcid":"https://orcid.org/0000-0001-9683-4971"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Zhiying","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037377300","display_name":"Long Ma","orcid":"https://orcid.org/0000-0001-5125-0198"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Long","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006602012","display_name":"Xin Fan","orcid":"https://orcid.org/0000-0001-5865-2464"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5042370642","display_name":"Risheng Liu","orcid":"https://orcid.org/0000-0002-9554-0565"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Risheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100675904"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.2669000029563904,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.2669000029563904,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.25999999046325684,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.18250000476837158,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.7172999978065491},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6207000017166138},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5618000030517578},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.489300012588501},{"id":"https://openalex.org/keywords/fusion-mechanism","display_name":"Fusion mechanism","score":0.48330000042915344},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.47850000858306885},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.45329999923706055},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.45170000195503235},{"id":"https://openalex.org/keywords/infrared","display_name":"Infrared","score":0.40230000019073486}],"concepts":[{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.7172999978065491},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7067000269889832},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6207000017166138},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6054999828338623},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5618000030517578},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.489300012588501},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.48330000042915344},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47870001196861267},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.47850000858306885},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.45329999923706055},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.45170000195503235},{"id":"https://openalex.org/C158355884","wikidata":"https://www.wikidata.org/wiki/Q11388","display_name":"Infrared","level":2,"score":0.40230000019073486},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.3905999958515167},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.37369999289512634},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.37229999899864197},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.34880000352859497},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.3199000060558319},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3142000138759613},{"id":"https://openalex.org/C2779679103","wikidata":"https://www.wikidata.org/wiki/Q5251805","display_name":"Degradation (telecommunications)","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C2779222261","wikidata":"https://www.wikidata.org/wiki/Q624587","display_name":"Thermography","level":3,"score":0.30320000648498535},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.28450000286102295},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.27869999408721924},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.27790001034736633},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2689000070095062},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.26179999113082886},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.25029999017715454}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2510.09343","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.09343","pdf_url":"https://arxiv.org/pdf/2510.09343","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2510.09343","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.09343","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2510.09343","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.09343","pdf_url":"https://arxiv.org/pdf/2510.09343","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"engage":[1],"in":[2,54],"the":[3,51,64,76,84,95,101,109,134,142,149,163,167,173],"relatively":[4],"underexplored":[5],"task":[6],"named":[7],"thermal":[8,85,168],"infrared":[9,13,177],"image":[10,14],"enhancement.":[11],"Existing":[12],"enhancement":[15,38,143],"methods":[16],"primarily":[17],"focus":[18],"on":[19,83,205],"tackling":[20],"individual":[21],"degradations,":[22],"such":[23],"as":[24],"noise,":[25],"contrast,":[26],"and":[27,67,155],"blurring,":[28],"making":[29],"it":[30],"difficult":[31],"to":[32,42,50,99,111,131,140,151],"handle":[33],"coupled":[34],"degradations.":[35],"Meanwhile,":[36],"all-in-one":[37],"methods,":[39],"commonly":[40],"applied":[41],"RGB":[43],"sensors,":[44],"often":[45],"demonstrate":[46],"limited":[47],"effectiveness":[48],"due":[49],"significant":[52],"differences":[53],"imaging":[55,65,86],"models.":[56],"In":[57,121],"sight":[58],"of":[59,91,137,166,183],"this,":[60],"we":[61,93,171],"first":[62],"revisit":[63],"mechanism":[66,128],"introduce":[68,172],"a":[69,123,180,210],"Progressive":[70,125],"Prompt":[71],"Fusion":[72],"Network":[73],"(PPFN).":[74],"Specifically,":[75],"PPFN":[77],"initially":[78],"establishes":[79],"prompt":[80,97],"pairs":[81,98],"based":[82],"process.":[87],"For":[88],"each":[89],"type":[90],"degradation,":[92],"fuse":[94],"corresponding":[96],"modulate":[100],"model's":[102,135],"features,":[103],"providing":[104],"adaptive":[105],"guidance":[106],"that":[107,188],"enables":[108],"model":[110,150],"better":[112],"address":[113],"specific":[114,198],"degradations":[115],"under":[116,197],"single":[117],"or":[118],"multiple":[119],"conditions.":[120],"addition,":[122],"Selective":[124],"Training":[126],"(SPT)":[127],"is":[129,215],"introduced":[130],"gradually":[132],"refine":[133],"handling":[136],"composite":[138],"cases":[139],"align":[141],"process,":[144],"which":[145],"not":[146,191],"only":[147,192],"allows":[148],"remove":[152],"camera":[153],"noise":[154],"retain":[156],"key":[157],"structural":[158],"details,":[159],"but":[160,200],"also":[161,201],"enhancing":[162],"overall":[164],"contrast":[165],"image.":[169],"Furthermore,":[170],"most":[174],"high-quality,":[175],"multi-scenarios":[176],"benchmark":[178],"covering":[179],"wide":[181],"range":[182],"scenarios.":[184],"Extensive":[185],"experiments":[186],"substantiate":[187],"our":[189],"approach":[190],"delivers":[193],"promising":[194],"visual":[195],"results":[196],"degradation":[199,207],"significantly":[202],"improves":[203],"performance":[204],"complex":[206],"scenes,":[208],"achieving":[209],"notable":[211],"8.76\\%":[212],"improvement.":[213],"Code":[214],"available":[216],"at":[217],"https://github.com/Zihang-Chen/HM-TIR.":[218]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-14T00:00:00"}
