{"id":"https://openalex.org/W4401567633","doi":"https://doi.org/10.1109/tiv.2024.3443264","title":"CDC-YOLOFusion: Leveraging Cross-Scale Dynamic Convolution Fusion for Visible-Infrared Object Detection","display_name":"CDC-YOLOFusion: Leveraging Cross-Scale Dynamic Convolution Fusion for Visible-Infrared Object Detection","publication_year":2024,"publication_date":"2024-08-14","ids":{"openalex":"https://openalex.org/W4401567633","doi":"https://doi.org/10.1109/tiv.2024.3443264"},"language":"en","primary_location":{"id":"doi:10.1109/tiv.2024.3443264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3443264","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010561697","display_name":"Zian Wang","orcid":"https://orcid.org/0009-0008-3510-3428"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zian Wang","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China"],"raw_orcid":"https://orcid.org/0009-0008-3510-3428","affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040862900","display_name":"Xianghui Liao","orcid":null},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xianghui Liao","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100603557","display_name":"Jin Yuan","orcid":"https://orcid.org/0000-0002-9600-7789"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Yuan","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0002-9600-7789","affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035821863","display_name":"You Yao","orcid":null},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"You Yao","raw_affiliation_strings":["USC Viterbi School of Engineering, University of Southern California, Los Angeles, CA, USA"],"raw_orcid":"https://orcid.org/0009-0001-8902-4193","affiliations":[{"raw_affiliation_string":"USC Viterbi School of Engineering, University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100396723","display_name":"Zhiyong Li","orcid":"https://orcid.org/0000-0001-9720-5915"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Li","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0001-9720-5915","affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":40.3469,"has_fulltext":false,"cited_by_count":32,"citation_normalized_percentile":{"value":0.99748676,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"10","issue":"3","first_page":"2080","last_page":"2093"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9448999762535095,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9287999868392944,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/infrared","display_name":"Infrared","score":0.7513676881790161},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.6390251517295837},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.6244129538536072},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.6198468208312988},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4953876733779907},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4719630479812622},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37427330017089844},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.26649707555770874},{"id":"https://openalex.org/keywords/optics","display_name":"Optics","score":0.23515266180038452}],"concepts":[{"id":"https://openalex.org/C158355884","wikidata":"https://www.wikidata.org/wiki/Q11388","display_name":"Infrared","level":2,"score":0.7513676881790161},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.6390251517295837},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.6244129538536072},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.6198468208312988},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4953876733779907},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4719630479812622},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37427330017089844},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.26649707555770874},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.23515266180038452},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tiv.2024.3443264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3443264","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4041047505","display_name":null,"funder_award_id":"U23A20341","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8354495100","display_name":null,"funder_award_id":"U21A20518","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8637866159","display_name":null,"funder_award_id":"62272157","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W1536680647","https://openalex.org/W2041346029","https://openalex.org/W2056716515","https://openalex.org/W2176924101","https://openalex.org/W2597926275","https://openalex.org/W2622634896","https://openalex.org/W2915569587","https://openalex.org/W2963037989","https://openalex.org/W2963150697","https://openalex.org/W3006663681","https://openalex.org/W3034421924","https://openalex.org/W3035678286","https://openalex.org/W3036931590","https://openalex.org/W3133873791","https://openalex.org/W3152390103","https://openalex.org/W3156772576","https://openalex.org/W3164282918","https://openalex.org/W3164576087","https://openalex.org/W3168463823","https://openalex.org/W3177052299","https://openalex.org/W3186033197","https://openalex.org/W3199191229","https://openalex.org/W3203003533","https://openalex.org/W3207919963","https://openalex.org/W3212881378","https://openalex.org/W3213472242","https://openalex.org/W4200631567","https://openalex.org/W4210621820","https://openalex.org/W4304080855","https://openalex.org/W4312594135","https://openalex.org/W4312735552","https://openalex.org/W4312946813","https://openalex.org/W4313007055","https://openalex.org/W4317036849","https://openalex.org/W4318624514","https://openalex.org/W4319299740","https://openalex.org/W4327785494","https://openalex.org/W4366378409","https://openalex.org/W4376131895","https://openalex.org/W4379528676","https://openalex.org/W4382119971","https://openalex.org/W4385245566","https://openalex.org/W4385326867","https://openalex.org/W4386076325","https://openalex.org/W4386083029","https://openalex.org/W4386189887","https://openalex.org/W4386737234","https://openalex.org/W4388854490","https://openalex.org/W4390787329","https://openalex.org/W4390873988","https://openalex.org/W4390874259","https://openalex.org/W4391461226","https://openalex.org/W4391559729","https://openalex.org/W4391849436","https://openalex.org/W4391953389","https://openalex.org/W4392132227","https://openalex.org/W4395017707","https://openalex.org/W6620707391","https://openalex.org/W6757585730","https://openalex.org/W6767312599","https://openalex.org/W6802521057","https://openalex.org/W6843259600","https://openalex.org/W6845935626","https://openalex.org/W6861081364"],"related_works":["https://openalex.org/W2374614594","https://openalex.org/W2391549584","https://openalex.org/W2737719445","https://openalex.org/W2099421762","https://openalex.org/W2362091980","https://openalex.org/W2530546662","https://openalex.org/W4387838477","https://openalex.org/W4239098401","https://openalex.org/W2391203560","https://openalex.org/W2967030268"],"abstract_inverted_index":{"Feature-level":[0],"fusion":[1,25],"methods":[2,26],"have":[3],"demonstrated":[4],"superior":[5],"performance":[6,191,198],"for":[7,167],"visible-infrared":[8],"object":[9],"detection":[10,176],"due":[11],"to":[12,34,39,42,67,91,117,154,202,208],"the":[13,110,130,151,186,209],"deep":[14],"exploration":[15],"of":[16,132,164],"visible":[17,96],"and":[18,70,97,161],"infrared":[19,98],"features.":[20],"However,":[21],"most":[22],"existing":[23,187],"feature-level":[24],"utilize":[27],"multiple":[28],"convolutional":[29],"layers":[30],"with":[31,199],"fixed":[32],"parameters":[33],"extract":[35,69],"bimodal":[36,72],"features,":[37],"leading":[38],"low":[40],"adaptivity":[41],"diverse":[43],"data":[44,76,84],"distributions.":[45],"This":[46],"paper":[47],"proposes":[48],"a":[49,59,82,124,144],"Cross-scale":[50,61],"Dynamic":[51,62],"Convolution-driven":[52],"YOLO":[53],"Fusion":[54,64],"(CDC-YOLOFusion)":[55],"network,":[56],"which":[57,128],"introduces":[58],"novel":[60,83,145],"Convolution":[63],"(CDCF)":[65],"module":[66],"adaptively":[68],"fuse":[71],"features":[73,116,134,160,163],"concerning":[74],"on":[75,108,157,173],"distribution.":[77],"Technically,":[78],"CDC-YOLOFusion":[79],"first":[80],"designs":[81],"augmentation":[85],"strategy":[86],"\u201cCross-modal":[87],"Data":[88],"Swapping\u201d":[89],"(CDS)":[90],"exchange":[92],"local":[93,105],"regions":[94],"between":[95,135],"images,":[99],"effectively":[100,141],"capturing":[101],"cross-modal":[102,146],"correlations":[103],"within":[104],"regions.":[106],"Building":[107],"this,":[109],"proposed":[111],"CDCF":[112,139,180],"utilizes":[113],"cross-scale":[114],"enhanced":[115],"assist":[118],"dynamic":[119],"convolution":[120],"prediction":[121],"by":[122,143],"introducing":[123],"disparity":[125],"attention":[126],"mask,":[127],"emphasizes":[129],"extraction":[131],"disparate":[133],"two":[136],"modalities.":[137],"Our":[138],"is":[140],"guided":[142],"kernel":[147],"interaction":[148],"loss,":[149],"aiming":[150],"learned":[152],"kernels":[153],"simultaneously":[155],"focus":[156],"common":[158],"salient":[159],"unique":[162],"each":[165],"modality":[166],"comprehensive":[168],"feature":[169],"generation.":[170],"Extensive":[171],"experiments":[172],"three":[174],"representative":[175],"datasets":[177],"demonstrate":[178],"that":[179],"can":[181],"be":[182],"easily":[183],"plugined":[184],"into":[185],"pipelines,":[188],"obtaining":[189],"consistent":[190],"improvements.":[192],"Moreover,":[193],"our":[194],"approach":[195],"yields":[196],"SOTA":[197],"about":[200],"2%":[201],"3%":[203],"mAP":[204],"improvements":[205],"as":[206],"compared":[207],"state-of-the-art":[210],"methods.":[211]},"counts_by_year":[{"year":2026,"cited_by_count":14},{"year":2025,"cited_by_count":16},{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-13T07:54:00.901334","created_date":"2025-10-10T00:00:00"}
