{"id":"https://openalex.org/W7129293643","doi":"https://doi.org/10.1109/icipw68931.2025.11385981","title":"Dynamic Object Detection for Autonomous Vehicles Using Multi-Modal Knowledge Distillation","display_name":"Dynamic Object Detection for Autonomous Vehicles Using Multi-Modal Knowledge Distillation","publication_year":2025,"publication_date":"2025-09-14","ids":{"openalex":"https://openalex.org/W7129293643","doi":"https://doi.org/10.1109/icipw68931.2025.11385981"},"language":null,"primary_location":{"id":"doi:10.1109/icipw68931.2025.11385981","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icipw68931.2025.11385981","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Image Processing Workshops (ICIPW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102876878","display_name":"Vishnudatta Thota","orcid":null},"institutions":[{"id":"https://openalex.org/I94234084","display_name":"Indian Institute of Technology Kanpur","ror":"https://ror.org/05pjsgx75","country_code":"IN","type":"education","lineage":["https://openalex.org/I94234084"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Vishnudatta Thota","raw_affiliation_strings":["Indian Institute of Technology,Kanpur,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology,Kanpur,India","institution_ids":["https://openalex.org/I94234084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5126229856","display_name":"Tushar Sandhan","orcid":null},"institutions":[{"id":"https://openalex.org/I94234084","display_name":"Indian Institute of Technology Kanpur","ror":"https://ror.org/05pjsgx75","country_code":"IN","type":"education","lineage":["https://openalex.org/I94234084"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Tushar Sandhan","raw_affiliation_strings":["Indian Institute of Technology,Kanpur,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology,Kanpur,India","institution_ids":["https://openalex.org/I94234084"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5102876878"],"corresponding_institution_ids":["https://openalex.org/I94234084"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.74155729,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"374","last_page":"379"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9567000269889832,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9567000269889832,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.0142000000923872,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11038","display_name":"Advanced SAR Imaging Techniques","score":0.0031999999191612005,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.7052000164985657},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6414999961853027},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.48429998755455017},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4781999886035919},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.42239999771118164},{"id":"https://openalex.org/keywords/edge-detection","display_name":"Edge detection","score":0.390500009059906},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.3571999967098236}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7215999960899353},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.7052000164985657},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6680999994277954},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6414999961853027},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6225000023841858},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.48429998755455017},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4781999886035919},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.42239999771118164},{"id":"https://openalex.org/C193536780","wikidata":"https://www.wikidata.org/wiki/Q1513153","display_name":"Edge detection","level":4,"score":0.390500009059906},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3571999967098236},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.34850001335144043},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33709999918937683},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.32589998841285706},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.3037000000476837},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2754000127315521},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.2678999900817871},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icipw68931.2025.11385981","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icipw68931.2025.11385981","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Image Processing Workshops (ICIPW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1973644502","https://openalex.org/W2069537876","https://openalex.org/W2901505625","https://openalex.org/W2952787292","https://openalex.org/W2963438049","https://openalex.org/W2967098543","https://openalex.org/W2972006294","https://openalex.org/W2991138066","https://openalex.org/W3096609285","https://openalex.org/W3108124733","https://openalex.org/W3118518413","https://openalex.org/W3128655704","https://openalex.org/W3211204716","https://openalex.org/W4283826072","https://openalex.org/W4289861074","https://openalex.org/W4372260444","https://openalex.org/W4386596822","https://openalex.org/W4386598287","https://openalex.org/W4396525349","https://openalex.org/W4402916760","https://openalex.org/W4406728012"],"related_works":[],"abstract_inverted_index":{"Object":[0],"detection":[1,23,98,133],"is":[2,12],"a":[3,27,124],"crucial":[4],"task":[5],"performed":[6,114],"by":[7],"autonomous":[8,76],"vehicles.":[9],"Multi-modal":[10],"data":[11,87,148],"widely":[13],"used":[14],"to":[15,58,71,84,136],"increase":[16],"the":[17,34,37,53,101,108,116,130,137],"robustness":[18],"and":[19,36,103,140,160],"accuracy":[20],"of":[21,55],"object":[22,97,132],"tasks.":[24],"We":[25,89],"propose":[26],"simplified":[28],"fusion":[29],"technique":[30],"for":[31,96,129,155],"effectively":[32],"combining":[33],"visual":[35],"corresponding":[38],"radar":[39],"data.":[40],"It":[41,66],"forms":[42],"3-channel":[43],"fused":[44],"image,":[45],"which":[46],"resembles":[47],"ubiquitous":[48],"RGB":[49],"channels,":[50],"thus":[51],"increases":[52],"versatility":[54],"proposed":[56],"method":[57],"be":[59,69,163],"integrated":[60,70],"with":[61,75],"multiple":[62],"existing":[63,72],"CNN":[64],"architectures.":[65],"can":[67],"easily":[68],"edge":[73],"devices":[74],"navigation":[77],"platforms":[78],"as":[79,134],"it":[80,122,144],"manipulates":[81],"input":[82],"modalities":[83],"create":[85],"combined":[86],"structure.":[88],"have":[90],"also":[91],"given":[92],"weight":[93],"update":[94,105],"rules":[95],"models,":[99],"namely":[100],"Single":[102],"Double-weight":[104],"rules,":[106],"utilize":[107],"knowledge":[109],"distillation":[110],"framework.":[111],"Experiments":[112],"were":[113],"using":[115],"dataset":[117],"having":[118],"various":[119],"illuminations,":[120],"where":[121],"achieved":[123],"3.5%":[125],"improvement":[126],"in":[127],"precision":[128],"dynamic":[131],"compared":[135],"state-of-the-art":[138],"YOLOv8":[139],"YOLOS":[141],"models.":[142],"Further-more,":[143],"generalizes":[145],"well":[146],"across":[147],"distributions":[149],"(e.g.":[150],"dark":[151],"illumination,":[152],"shadows":[153],"etc.)":[154],"better":[156],"predictions.":[157],"Our":[158],"codes":[159],"datasets":[161],"will":[162],"publicly":[164],"available.":[165]},"counts_by_year":[],"updated_date":"2026-02-19T06:27:42.648592","created_date":"2026-02-18T00:00:00"}
