{"id":"https://openalex.org/W4416751112","doi":"https://doi.org/10.1109/iros60139.2025.11247103","title":"CoDifFu: Diffusion-Based Collaborative Perception with Efficient Heterogeneous Feature Fusion","display_name":"CoDifFu: Diffusion-Based Collaborative Perception with Efficient Heterogeneous Feature Fusion","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4416751112","doi":"https://doi.org/10.1109/iros60139.2025.11247103"},"language":null,"primary_location":{"id":"doi:10.1109/iros60139.2025.11247103","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11247103","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Zeyu Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zeyu Meng","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,Institute of Artificial Intelligence and Robotics,CN"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,Institute of Artificial Intelligence and Robotics,CN","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110814145","display_name":"Yonghong Song","orcid":"https://orcid.org/0000-0001-5978-3781"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yonghong Song","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,School of Software Engineering,CN"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,School of Software Engineering,CN","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046450643","display_name":"Yuanlin Zhang","orcid":"https://orcid.org/0000-0003-0960-3636"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanlin Zhang","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,Institute of Artificial Intelligence and Robotics,CN"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,Institute of Artificial Intelligence and Robotics,CN","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109737208","display_name":"Zenan Bai","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zenan Bai","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,School of Software Engineering,CN"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,School of Software Engineering,CN","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113242844","display_name":"Jiayi Duan","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiayi Duan","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,School of Software Engineering,CN"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,School of Software Engineering,CN","institution_ids":["https://openalex.org/I87445476"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I87445476"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.36355175,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"10108","last_page":"10115"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7175999879837036,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7175999879837036,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.028200000524520874,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.022199999541044235,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.6187999844551086},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.588100016117096},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5580000281333923},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5284000039100647},{"id":"https://openalex.org/keywords/feature-matching","display_name":"Feature matching","score":0.477400004863739},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.42179998755455017},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4081999957561493},{"id":"https://openalex.org/keywords/landmark","display_name":"Landmark","score":0.3970000147819519}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7566999793052673},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.6187999844551086},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6096000075340271},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.588100016117096},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5580000281333923},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5284000039100647},{"id":"https://openalex.org/C2983787585","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature matching","level":3,"score":0.477400004863739},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44449999928474426},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42179998755455017},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4081999957561493},{"id":"https://openalex.org/C2780297707","wikidata":"https://www.wikidata.org/wiki/Q4895393","display_name":"Landmark","level":2,"score":0.3970000147819519},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.38580000400543213},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.38499999046325684},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.36000001430511475},{"id":"https://openalex.org/C2780310539","wikidata":"https://www.wikidata.org/wiki/Q12547192","display_name":"Imperfect","level":2,"score":0.35910001397132874},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.3472000062465668},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3463999927043915},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3353999853134155},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32710000872612},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.3181999921798706},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.27799999713897705},{"id":"https://openalex.org/C2781234732","wikidata":"https://www.wikidata.org/wiki/Q943505","display_name":"Fusion center","level":4,"score":0.26820001006126404},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.2662999927997589}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros60139.2025.11247103","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11247103","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2968296999","https://openalex.org/W2982681137","https://openalex.org/W2985739927","https://openalex.org/W2996759437","https://openalex.org/W3035098634","https://openalex.org/W3096609285","https://openalex.org/W3109991383","https://openalex.org/W3123928227","https://openalex.org/W3201193904","https://openalex.org/W3210076120","https://openalex.org/W4312604822","https://openalex.org/W4312933868","https://openalex.org/W4312939270","https://openalex.org/W4383108834","https://openalex.org/W4390873752","https://openalex.org/W4390874305","https://openalex.org/W4394592975","https://openalex.org/W4403889749","https://openalex.org/W4409262867"],"related_works":[],"abstract_inverted_index":{"Multi-Agent":[0],"collaborative":[1,51],"perception":[2,32,52],"is":[3],"currently":[4],"experiencing":[5],"a":[6,11,48,76,112,129],"surge":[7],"in":[8,21,30,63,162],"attention":[9],"as":[10,35,138],"novel":[12,49],"approach":[13],"to":[14,27,92,100,119,140],"addressing":[15],"autonomous":[16],"driving":[17],"challenges.":[18],"Despite":[19],"advances":[20],"previous":[22],"efforts,":[23],"challenges":[24],"remain":[25],"due":[26],"various":[28],"dilemmas":[29],"the":[31,82,89,93,97,102,106,108,122,135,171,176],"process,":[33],"such":[34],"imperfect":[36],"localization":[37,58],"and":[38,60,149,165,175],"collaboration":[39,151],"heterogeneity.":[40,152],"To":[41,153],"tackle":[42],"these":[43],"issues,":[44],"we":[45,127,157],"propose":[46],"CoDifFu,":[47,156],"diffusion-based":[50,68],"framework":[53],"that":[54],"enhances":[55],"robustness":[56],"against":[57],"uncertainty":[59],"improves":[61],"efficiency":[62],"heterogeneous":[64],"feature":[65,144],"fusion.":[66],"A":[67],"detection":[69,161],"head":[70],"progressively":[71,110],"denoises":[72],"object":[73,160],"centers":[74,116],"through":[75],"learnable":[77],"reverse":[78,101],"process.":[79,104],"During":[80],"training,":[81],"center":[83],"coordinates":[84],"of":[85,114,117,146,173,178],"objects":[86],"diffuse":[87],"from":[88],"ground":[90,123],"truth":[91,124],"Gaussian":[94],"distribution,":[95],"then":[96],"network":[98],"learns":[99],"diffusion":[103],"In":[105],"inference,":[107],"model":[109],"refines":[111],"set":[113],"random":[115],"boxes":[118],"align":[120],"with":[121],"centers.":[125],"Moreover,":[126],"devised":[128],"confidence-guided":[130],"multi-agent":[131],"communication":[132],"module(CMC),":[133],"utilizing":[134],"confidence":[136],"map":[137],"guidance":[139],"effectively":[141],"achieve":[142],"complementary":[143],"fusion":[145],"multi-agent\u2019s":[147],"features":[148],"alleviates":[150],"thoroughly":[154],"evaluate":[155],"consider":[158],"3D":[159],"both":[163],"real-world":[164],"simulation":[166],"scenarios.":[167],"Extensive":[168],"experiments":[169],"demonstrate":[170],"superiority":[172],"CoDifFu":[174],"effectiveness":[177],"all":[179],"its":[180],"vital":[181],"components.":[182],"The":[183],"code":[184],"will":[185],"be":[186],"released.":[187]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-11-28T00:00:00"}
