{"id":"https://openalex.org/W4401414563","doi":"https://doi.org/10.1109/icra57147.2024.10610545","title":"EMIFF: Enhanced Multi-scale Image Feature Fusion for Vehicle-Infrastructure Cooperative 3D Object Detection","display_name":"EMIFF: Enhanced Multi-scale Image Feature Fusion for Vehicle-Infrastructure Cooperative 3D Object Detection","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4401414563","doi":"https://doi.org/10.1109/icra57147.2024.10610545"},"language":"en","primary_location":{"id":"doi:10.1109/icra57147.2024.10610545","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10610545","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100407596","display_name":"Zhe Wang","orcid":"https://orcid.org/0000-0002-0597-4475"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhe Wang","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007154878","display_name":"Siqi Fan","orcid":"https://orcid.org/0000-0003-4962-6293"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siqi Fan","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044920305","display_name":"Xiaoliang Huo","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoliang Huo","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022610350","display_name":"Tongda Xu","orcid":"https://orcid.org/0000-0002-5594-3992"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tongda Xu","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100322699","display_name":"Yan Wang","orcid":"https://orcid.org/0000-0002-4751-0708"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan Wang","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115596103","display_name":"Jingjing Liu","orcid":"https://orcid.org/0009-0008-0338-8465"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing Liu","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020418881","display_name":"Yilun Chen","orcid":"https://orcid.org/0000-0002-9134-9368"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yilun Chen","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100663306","display_name":"Yaqin Zhang","orcid":"https://orcid.org/0000-0001-5675-8804"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ya-Qin Zhang","raw_affiliation_strings":["Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for AI Industry Research (AIR),Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100407596"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":3.1698,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.9300783,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"16388","last_page":"16394"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11606","display_name":"Infrastructure Maintenance and Monitoring","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7123496532440186},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6523966789245605},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6277352571487427},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5805591940879822},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5736786127090454},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.5729110836982727},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.527755081653595},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.48066723346710205},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4712646007537842},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4658876955509186},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.4393857717514038},{"id":"https://openalex.org/keywords/feature-detection","display_name":"Feature detection (computer vision)","score":0.42841556668281555},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36993926763534546},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.2545571029186249},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.05869007110595703}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7123496532440186},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6523966789245605},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6277352571487427},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5805591940879822},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5736786127090454},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.5729110836982727},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.527755081653595},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.48066723346710205},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4712646007537842},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4658876955509186},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4393857717514038},{"id":"https://openalex.org/C126422989","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature detection (computer vision)","level":4,"score":0.42841556668281555},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36993926763534546},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2545571029186249},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.05869007110595703},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra57147.2024.10610545","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10610545","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5799999833106995,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W2115579991","https://openalex.org/W2194775991","https://openalex.org/W2565639579","https://openalex.org/W2601564443","https://openalex.org/W2752782242","https://openalex.org/W2897529137","https://openalex.org/W2968296999","https://openalex.org/W2982770724","https://openalex.org/W3034669477","https://openalex.org/W3035098634","https://openalex.org/W3035574168","https://openalex.org/W3109395584","https://openalex.org/W3109991383","https://openalex.org/W3171032126","https://openalex.org/W3173668541","https://openalex.org/W3201193904","https://openalex.org/W3215100485","https://openalex.org/W4224947594","https://openalex.org/W4225793049","https://openalex.org/W4226305814","https://openalex.org/W4281255813","https://openalex.org/W4284701604","https://openalex.org/W4286544732","https://openalex.org/W4290056039","https://openalex.org/W4297411803","https://openalex.org/W4312604822","https://openalex.org/W4312894406","https://openalex.org/W4312939270","https://openalex.org/W4319300075","https://openalex.org/W4330338357","https://openalex.org/W4382464460","https://openalex.org/W4383108819","https://openalex.org/W4385804883","https://openalex.org/W4386083148","https://openalex.org/W4386634496","https://openalex.org/W4390872833","https://openalex.org/W6769990807","https://openalex.org/W6785667878","https://openalex.org/W6802311648","https://openalex.org/W6810001583","https://openalex.org/W6810460759","https://openalex.org/W6811230113","https://openalex.org/W6838844109","https://openalex.org/W6839180059","https://openalex.org/W6839355098","https://openalex.org/W6839364997","https://openalex.org/W6840665015","https://openalex.org/W6842774165","https://openalex.org/W6851123386","https://openalex.org/W6941281266"],"related_works":["https://openalex.org/W2132659060","https://openalex.org/W2031992971","https://openalex.org/W2788731446","https://openalex.org/W2204403038","https://openalex.org/W3214791684","https://openalex.org/W3152170969","https://openalex.org/W2379054866","https://openalex.org/W2549658594","https://openalex.org/W2095903272","https://openalex.org/W2353265673"],"abstract_inverted_index":{"In":[0],"autonomous":[1],"driving,":[2],"cooperative":[3,39],"perception":[4],"makes":[5],"use":[6],"of":[7,24],"multi-view":[8,50],"cameras":[9],"from":[10,65,95],"both":[11,96],"vehicles":[12,97],"and":[13,98,106,115,121,143,163],"infrastructure,":[14,99],"providing":[15],"a":[16,28,75,136],"global":[17],"vantage":[18],"point":[19],"with":[20,141,166],"rich":[21],"semantic":[22],"context":[23],"road":[25],"conditions":[26],"beyond":[27],"single":[29],"vehicle":[30,116],"viewpoint.":[31],"Currently,":[32],"two":[33],"major":[34],"challenges":[35],"persist":[36],"in":[37,61],"vehicle-infrastructure":[38],"3D":[40,78],"(VIC3D)":[41],"object":[42],"detection:":[43],"1)":[44],"inherent":[45],"pose":[46,127],"errors":[47],"when":[48],"fusing":[49],"images,":[51],"caused":[52],"by":[53,130],"time":[54],"asynchrony":[55],"across":[56],"cameras;":[57],"2)":[58],"information":[59],"loss":[60],"transmission":[62,148,168],"process":[63],"resulted":[64],"limited":[66],"communication":[67],"bandwidth.":[68],"To":[69,90],"address":[70],"these":[71],"issues,":[72],"we":[73,100],"propose":[74,101],"novel":[76],"camera-based":[77],"detection":[79],"framework":[80],"for":[81,147],"VIC3D":[82],"task,":[83],"Enhanced":[84],"Multi-scale":[85,102],"Image":[86],"Feature":[87,137],"Fusion":[88],"(EMIFF).":[89],"fully":[91],"exploit":[92],"holistic":[93],"perspectives":[94],"Cross":[103],"Attention":[104],"(MCA)":[105],"Camera-aware":[107],"Channel":[108],"Masking":[109],"(CCM)":[110],"modules":[111],"to":[112,124],"enhance":[113],"infrastructure":[114],"features":[117],"at":[118],"scale,":[119],"spatial,":[120],"channel":[122,142],"levels":[123],"correct":[125],"the":[126],"error":[128],"introduced":[129],"camera":[131],"asynchrony.":[132],"We":[133],"also":[134],"introduce":[135],"Compression":[138],"(FC)":[139],"module":[140],"spatial":[144],"compression":[145],"blocks":[146],"efficiency.":[149],"Experiments":[150],"show":[151],"that":[152],"EMIFF":[153],"achieves":[154],"SOTA":[155],"on":[156],"DAIR-V2X-C":[157],"datasets,":[158],"significantly":[159],"outperforming":[160],"previous":[161],"early-fusion":[162],"late-fusion":[164],"methods":[165],"comparable":[167],"costs.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-03T08:47:05.690250","created_date":"2025-10-10T00:00:00"}
