{"id":"https://openalex.org/W7124137174","doi":"https://doi.org/10.1109/icpads67057.2025.11322970","title":"VIF-YOLO: Visible-Infrared Fusion YOLO for Remote Sensing Small Object Detection","display_name":"VIF-YOLO: Visible-Infrared Fusion YOLO for Remote Sensing Small Object Detection","publication_year":2025,"publication_date":"2025-12-14","ids":{"openalex":"https://openalex.org/W7124137174","doi":"https://doi.org/10.1109/icpads67057.2025.11322970"},"language":null,"primary_location":{"id":"doi:10.1109/icpads67057.2025.11322970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpads67057.2025.11322970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 31th International Conference on Parallel and Distributed Systems (ICPADS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122178412","display_name":"Renjie Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Renjie Chen","raw_affiliation_strings":["School of Software, Xinjiang University,Urumqi,China"],"affiliations":[{"raw_affiliation_string":"School of Software, Xinjiang University,Urumqi,China","institution_ids":["https://openalex.org/I96908189"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111701038","display_name":"Hua Yan Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hua Sun","raw_affiliation_strings":["School of Software, Xinjiang University,Urumqi,China"],"affiliations":[{"raw_affiliation_string":"School of Software, Xinjiang University,Urumqi,China","institution_ids":["https://openalex.org/I96908189"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122099547","display_name":"Haiyang Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haiyang Fan","raw_affiliation_strings":["School of Software, Xinjiang University,Urumqi,China"],"affiliations":[{"raw_affiliation_string":"School of Software, Xinjiang University,Urumqi,China","institution_ids":["https://openalex.org/I96908189"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5122236309","display_name":"Pingxiang Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I96908189","display_name":"Xinjiang University","ror":"https://ror.org/059gw8r13","country_code":"CN","type":"education","lineage":["https://openalex.org/I96908189"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pingxiang Wu","raw_affiliation_strings":["School of Software, Xinjiang University,Urumqi,China"],"affiliations":[{"raw_affiliation_string":"School of Software, Xinjiang University,Urumqi,China","institution_ids":["https://openalex.org/I96908189"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5122178412"],"corresponding_institution_ids":["https://openalex.org/I96908189"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.71505112,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.5918999910354614,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.5918999910354614,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.12129999697208405,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.08269999921321869,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multispectral-image","display_name":"Multispectral image","score":0.873199999332428},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.7006000280380249},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5891000032424927},{"id":"https://openalex.org/keywords/visibility","display_name":"Visibility","score":0.5159000158309937},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.4848000109195709},{"id":"https://openalex.org/keywords/multispectral-pattern-recognition","display_name":"Multispectral pattern recognition","score":0.44190001487731934},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.43059998750686646},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.41909998655319214}],"concepts":[{"id":"https://openalex.org/C173163844","wikidata":"https://www.wikidata.org/wiki/Q1761440","display_name":"Multispectral image","level":2,"score":0.873199999332428},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.748199999332428},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.7184000015258789},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.7006000280380249},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5996999740600586},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5925999879837036},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5891000032424927},{"id":"https://openalex.org/C123403432","wikidata":"https://www.wikidata.org/wiki/Q654068","display_name":"Visibility","level":2,"score":0.5159000158309937},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4848000109195709},{"id":"https://openalex.org/C104541649","wikidata":"https://www.wikidata.org/wiki/Q6935090","display_name":"Multispectral pattern recognition","level":3,"score":0.44190001487731934},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.43059998750686646},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.41909998655319214},{"id":"https://openalex.org/C183365957","wikidata":"https://www.wikidata.org/wiki/Q17140402","display_name":"Remote sensing application","level":3,"score":0.4142000079154968},{"id":"https://openalex.org/C159078339","wikidata":"https://www.wikidata.org/wiki/Q959005","display_name":"Hyperspectral imaging","level":2,"score":0.41019999980926514},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.40209999680519104},{"id":"https://openalex.org/C203595873","wikidata":"https://www.wikidata.org/wiki/Q25389927","display_name":"Change detection","level":2,"score":0.38609999418258667},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.33660000562667847},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.3231000006198883},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.2533999979496002}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpads67057.2025.11322970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpads67057.2025.11322970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 31th International Conference on Parallel and Distributed Systems (ICPADS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2092380336","https://openalex.org/W2102605133","https://openalex.org/W2176924101","https://openalex.org/W2946490545","https://openalex.org/W2983056308","https://openalex.org/W3106808132","https://openalex.org/W3213472242","https://openalex.org/W4285264169","https://openalex.org/W4296138560","https://openalex.org/W4327652243","https://openalex.org/W4327785494","https://openalex.org/W4385801610","https://openalex.org/W4386189887","https://openalex.org/W4389491034","https://openalex.org/W4396901107","https://openalex.org/W4401806723","https://openalex.org/W4404177279","https://openalex.org/W4404909364"],"related_works":[],"abstract_inverted_index":{"The":[0],"remote":[1,15,36,69],"sensing":[2,16,37,70],"object":[3,54,64,90,178],"detection":[4,17,33,38,75,191,220],"technique":[5],"has":[6],"shown":[7],"considerable":[8],"applicability":[9],"across":[10],"various":[11],"domains.":[12,140],"Visible":[13,56],"light":[14],"is":[18,39],"easily":[19],"affected":[20,41],"by":[21,42,79],"environmental":[22,43],"factors":[23],"such":[24],"as":[25],"lighting":[26],"and":[27,58,92,122,125,184,196,208],"weather":[28],"conditions,":[29],"resulting":[30],"in":[31,53,88,137,218],"poor":[32],"performance.":[34],"Infrared":[35],"less":[40],"factors,":[44],"but":[45],"its":[46,51],"limited":[47],"texture":[48],"detail":[49],"restricts":[50],"accuracy":[52],"detection.":[55],"imagery":[57,60],"infrared":[59],"combined":[61],"for":[62,176],"multispectral":[63,74,102,177],"recognition":[65],"effectively":[66],"address":[67],"complex":[68],"scenarios.":[71],"Nonetheless,":[72],"prior":[73],"algorithms":[76],"are":[77],"plagued":[78],"challenges":[80],"like":[81],"inadequate":[82],"modality":[83],"information":[84,163],"fusion,":[85],"inferior":[86],"performance":[87],"multi-scale":[89],"detection,":[91,179],"insufficient":[93],"exploitation":[94],"of":[95,132,205,215],"semantic":[96],"information.":[97],"We":[98,169],"propose":[99],"a":[100,172,188],"novel":[101],"fusion":[103,131],"architecture":[104],"to":[105,119,154],"tackle":[106],"these":[107],"difficulties.":[108],"Initially,":[109],"we":[110,142],"developed":[111,171],"the":[112,144,151,157,194,213],"Cross-modal":[113],"Adaptive":[114],"Frequency":[115],"Fusion":[116],"(CAFF)":[117],"module":[118,153],"independently":[120],"decompose":[121],"integrate":[123],"highfrequency":[124],"low-frequency":[126],"information,":[127],"thereby":[128],"achieving":[129],"fine":[130,166],"images":[133],"from":[134],"different":[135,138],"modalities":[136],"frequency":[139],"Subsequently,":[141],"integrated":[143],"Multi-scale":[145],"Receptive":[146],"Field":[147],"Aggregator":[148],"(MRFA)":[149],"into":[150],"SPPF":[152],"ensure":[155],"that":[156],"target":[158],"obtains":[159],"sufficient":[160],"global":[161],"contextual":[162],"while":[164],"maintaining":[165],"spatial":[167],"details.":[168],"have":[170],"feature":[173,182],"pyramid":[174],"network":[175],"significantly":[180],"improving":[181],"interaction":[183],"fusion.":[185],"This":[186],"constitutes":[187],"thorough":[189],"VIF-YOLO":[190,199],"framework.":[192],"On":[193],"VEDAI":[195],"LLVIP":[197],"datasets,":[198],"attains":[200],"<tex":[201],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[202],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\text{mAP}_{50}$</tex>":[203],"values":[204],"75.1":[206],"%":[207],"96.3":[209],"%,":[210],"respectively,":[211],"illustrating":[212],"efficacy":[214],"our":[216],"approach":[217],"enhancing":[219],"capabilities.":[221]},"counts_by_year":[],"updated_date":"2026-01-16T23:16:36.188383","created_date":"2026-01-15T00:00:00"}
