{"id":"https://openalex.org/W4398230590","doi":"https://doi.org/10.48550/arxiv.2405.12944","title":"AMFD: Distillation via Adaptive Multimodal Fusion for Multispectral Pedestrian Detection","display_name":"AMFD: Distillation via Adaptive Multimodal Fusion for Multispectral Pedestrian Detection","publication_year":2024,"publication_date":"2024-05-21","ids":{"openalex":"https://openalex.org/W4398230590","doi":"https://doi.org/10.48550/arxiv.2405.12944"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2405.12944","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.12944","pdf_url":"https://arxiv.org/pdf/2405.12944","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.12944","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044974889","display_name":"Zizhao Chen","orcid":"https://orcid.org/0000-0002-3851-4803"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Zizhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030832323","display_name":"Yeqiang Qian","orcid":"https://orcid.org/0000-0003-0831-8702"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Yeqiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005205790","display_name":"Xiaoxiao Yang","orcid":"https://orcid.org/0000-0003-0290-2844"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Xiaoxiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048517656","display_name":"Chunxiang Wang","orcid":"https://orcid.org/0000-0002-6885-6740"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Chunxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100418319","display_name":"Ming\u2013Hsuan Yang","orcid":"https://orcid.org/0000-0003-4848-2304"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Ming","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5044974889"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9388999938964844,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9388999938964844,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9136000275611877,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multispectral-image","display_name":"Multispectral image","score":0.8369021415710449},{"id":"https://openalex.org/keywords/pedestrian-detection","display_name":"Pedestrian detection","score":0.7411987781524658},{"id":"https://openalex.org/keywords/pedestrian","display_name":"Pedestrian","score":0.615952730178833},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5520400404930115},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.531134307384491},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.5129029750823975},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5093711614608765},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.4919831454753876},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4521784782409668},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3541069030761719},{"id":"https://openalex.org/keywords/environmental-science","display_name":"Environmental science","score":0.33779144287109375},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.23751720786094666},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.23186567425727844},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18199819326400757},{"id":"https://openalex.org/keywords/transport-engineering","display_name":"Transport engineering","score":0.08473560214042664}],"concepts":[{"id":"https://openalex.org/C173163844","wikidata":"https://www.wikidata.org/wiki/Q1761440","display_name":"Multispectral image","level":2,"score":0.8369021415710449},{"id":"https://openalex.org/C2780156472","wikidata":"https://www.wikidata.org/wiki/Q2355550","display_name":"Pedestrian detection","level":3,"score":0.7411987781524658},{"id":"https://openalex.org/C2777113093","wikidata":"https://www.wikidata.org/wiki/Q221488","display_name":"Pedestrian","level":2,"score":0.615952730178833},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5520400404930115},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.531134307384491},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.5129029750823975},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5093711614608765},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.4919831454753876},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4521784782409668},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3541069030761719},{"id":"https://openalex.org/C39432304","wikidata":"https://www.wikidata.org/wiki/Q188847","display_name":"Environmental science","level":0,"score":0.33779144287109375},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.23751720786094666},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.23186567425727844},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18199819326400757},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.08473560214042664},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2405.12944","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.12944","pdf_url":"https://arxiv.org/pdf/2405.12944","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2405.12944","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2405.12944","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2405.12944","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.12944","pdf_url":"https://arxiv.org/pdf/2405.12944","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4318664220","https://openalex.org/W2771047279","https://openalex.org/W4388409104","https://openalex.org/W2124951708","https://openalex.org/W3132270449","https://openalex.org/W4377289091","https://openalex.org/W2972620127","https://openalex.org/W3013647784","https://openalex.org/W2981141433","https://openalex.org/W2997281059"],"abstract_inverted_index":{"Multispectral":[0],"pedestrian":[1,60],"detection":[2,22,61],"has":[3,53],"been":[4,77],"shown":[5],"to":[6,33,40,141,160,203],"be":[7],"effective":[8],"in":[9,20,62,96,219],"improving":[10,226],"performance":[11],"within":[12],"complex":[13],"illumination":[14],"scenarios.":[15],"However,":[16,79],"prevalent":[17],"double-stream":[18],"networks":[19,42],"multispectral":[21,59,187],"employ":[23],"two":[24],"separate":[25],"feature":[26,46,175],"extraction":[27,47],"branches":[28],"for":[29,65,145,189],"multi-modal":[30,99],"data,":[31],"leading":[32],"nearly":[34],"double":[35],"the":[36,55,86,91,97,103,109,113,124,129,157,181,194,205],"inference":[37,51],"time":[38,52],"compared":[39],"single-stream":[41],"utilizing":[43],"only":[44,84],"one":[45],"branch.":[48],"This":[49,154],"increased":[50],"hindered":[54],"widespread":[56],"employment":[57],"of":[58,94,128,168,207],"embedded":[63],"devices":[64],"autonomous":[66],"systems.":[67],"To":[68,107],"address":[69],"this":[70],"limitation,":[71],"various":[72],"knowledge":[73],"distillation":[74,81],"methods":[75,82,218],"have":[76],"proposed.":[78],"traditional":[80],"focus":[83],"on":[85,193],"fusion":[87,163,176],"features":[88,127],"and":[89,150,198,225],"ignore":[90],"large":[92],"amount":[93],"information":[95],"original":[98,125],"features,":[100],"thereby":[101],"restricting":[102],"student":[104,146,158],"network's":[105],"performance.":[106],"tackle":[108],"challenge,":[110],"we":[111,179],"introduce":[112],"Adaptive":[114],"Modal":[115,134],"Fusion":[116],"Distillation":[117],"(AMFD)":[118],"framework,":[119],"which":[120],"can":[121],"fully":[122],"utilize":[123],"modal":[126],"teacher":[130,169],"network.":[131],"Specifically,":[132],"a":[133,184],"Extraction":[135],"Alignment":[136],"(MEA)":[137],"module":[138],"is":[139,232],"utilized":[140],"derive":[142],"learning":[143],"weights":[144],"networks,":[147],"integrating":[148],"focal":[149],"global":[151],"attention":[152],"mechanisms.":[153],"methodology":[155],"enables":[156],"network":[159,170],"acquire":[161],"optimal":[162],"strategies":[164],"independent":[165],"from":[166],"that":[167,212],"without":[171],"necessitating":[172],"an":[173],"additional":[174],"module.":[177],"Furthermore,":[178],"present":[180],"SMOD":[182,199],"dataset,":[183],"well-aligned":[185],"challenging":[186,195],"dataset":[188],"detection.":[190],"Extensive":[191],"experiments":[192],"KAIST,":[196],"LLVIP":[197],"datasets":[200],"are":[201],"conducted":[202],"validate":[204],"effectiveness":[206],"AMFD.":[208],"The":[209,230],"results":[210],"demonstrate":[211],"our":[213],"method":[214],"outperforms":[215],"existing":[216],"state-of-the-art":[217],"both":[220],"reducing":[221],"log-average":[222],"Miss":[223],"Rate":[224],"mean":[227],"Average":[228],"Precision.":[229],"code":[231],"available":[233],"at":[234],"https://github.com/bigD233/AMFD.git.":[235]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-31T06:02:25.137627","created_date":"2024-05-23T00:00:00"}
