{"id":"https://openalex.org/W3158128549","doi":"https://doi.org/10.1109/tcsvt.2021.3076466","title":"Uncertainty-Guided Cross-Modal Learning for Robust Multispectral Pedestrian Detection","display_name":"Uncertainty-Guided Cross-Modal Learning for Robust Multispectral Pedestrian Detection","publication_year":2021,"publication_date":"2021-04-29","ids":{"openalex":"https://openalex.org/W3158128549","doi":"https://doi.org/10.1109/tcsvt.2021.3076466","mag":"3158128549"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2021.3076466","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2021.3076466","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036936141","display_name":"Jung Uk Kim","orcid":"https://orcid.org/0000-0003-4533-4875"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jung Uk Kim","raw_affiliation_strings":["Image and Video Systems Laboratory, School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"raw_orcid":"https://orcid.org/0000-0003-4533-4875","affiliations":[{"raw_affiliation_string":"Image and Video Systems Laboratory, School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103104504","display_name":"Sungjune Park","orcid":"https://orcid.org/0000-0001-7482-4553"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sungjune Park","raw_affiliation_strings":["Image and Video Systems Laboratory, School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Image and Video Systems Laboratory, School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038798134","display_name":"Yong Man Ro","orcid":"https://orcid.org/0000-0001-5306-6853"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yong Man Ro","raw_affiliation_strings":["Image and Video Systems Laboratory, School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea"],"raw_orcid":"https://orcid.org/0000-0001-5306-6853","affiliations":[{"raw_affiliation_string":"Image and Video Systems Laboratory, School of Electrical Engineering, Korea Advanced Institute of Science and Technology (KAIST), Daejeon, South Korea","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":10.3755,"has_fulltext":false,"cited_by_count":121,"citation_normalized_percentile":{"value":0.98564735,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"32","issue":"3","first_page":"1510","last_page":"1523"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multispectral-image","display_name":"Multispectral image","score":0.7968580722808838},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7315497398376465},{"id":"https://openalex.org/keywords/pedestrian-detection","display_name":"Pedestrian detection","score":0.7255033850669861},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7230316400527954},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7054151296615601},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6878763437271118},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6429042220115662},{"id":"https://openalex.org/keywords/region-of-interest","display_name":"Region of interest","score":0.5458997488021851},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5310224890708923},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.4961009919643402},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.48044201731681824},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.4268644452095032},{"id":"https://openalex.org/keywords/pedestrian","display_name":"Pedestrian","score":0.242925226688385},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10892188549041748}],"concepts":[{"id":"https://openalex.org/C173163844","wikidata":"https://www.wikidata.org/wiki/Q1761440","display_name":"Multispectral image","level":2,"score":0.7968580722808838},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7315497398376465},{"id":"https://openalex.org/C2780156472","wikidata":"https://www.wikidata.org/wiki/Q2355550","display_name":"Pedestrian detection","level":3,"score":0.7255033850669861},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7230316400527954},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7054151296615601},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6878763437271118},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6429042220115662},{"id":"https://openalex.org/C19609008","wikidata":"https://www.wikidata.org/wiki/Q2138203","display_name":"Region of interest","level":2,"score":0.5458997488021851},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5310224890708923},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.4961009919643402},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.48044201731681824},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.4268644452095032},{"id":"https://openalex.org/C2777113093","wikidata":"https://www.wikidata.org/wiki/Q221488","display_name":"Pedestrian","level":2,"score":0.242925226688385},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10892188549041748},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcsvt.2021.3076466","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2021.3076466","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},{"id":"pmh:oai:koasas.kaist.ac.kr:10203/292815","is_oa":false,"landing_page_url":"http://hdl.handle.net/10203/292815","pdf_url":null,"source":{"id":"https://openalex.org/S4306402435","display_name":"KAIST Institutional Repository (KAIST)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I157485424","host_organization_name":"Korea Advanced Institute of Science and Technology","host_organization_lineage":["https://openalex.org/I157485424"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7099999785423279,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W1497910407","https://openalex.org/W1650122911","https://openalex.org/W1686810756","https://openalex.org/W1910108985","https://openalex.org/W2024046085","https://openalex.org/W2031454541","https://openalex.org/W2060300932","https://openalex.org/W2150066425","https://openalex.org/W2161969291","https://openalex.org/W2162409668","https://openalex.org/W2194775991","https://openalex.org/W2315907656","https://openalex.org/W2331956852","https://openalex.org/W2344132218","https://openalex.org/W2344556193","https://openalex.org/W2415234561","https://openalex.org/W2428342532","https://openalex.org/W2497039038","https://openalex.org/W2565639579","https://openalex.org/W2608096492","https://openalex.org/W2626967530","https://openalex.org/W2741620214","https://openalex.org/W2752263152","https://openalex.org/W2777705169","https://openalex.org/W2789621390","https://openalex.org/W2792925809","https://openalex.org/W2883363148","https://openalex.org/W2885641989","https://openalex.org/W2887564556","https://openalex.org/W2888527098","https://openalex.org/W2892614179","https://openalex.org/W2895077992","https://openalex.org/W2902502320","https://openalex.org/W2911671827","https://openalex.org/W2912984848","https://openalex.org/W2913889214","https://openalex.org/W2917092108","https://openalex.org/W2929607865","https://openalex.org/W2962677013","https://openalex.org/W2962721361","https://openalex.org/W2963037989","https://openalex.org/W2963150697","https://openalex.org/W2963167203","https://openalex.org/W2963188557","https://openalex.org/W2963315052","https://openalex.org/W2963351448","https://openalex.org/W2963579094","https://openalex.org/W2963786238","https://openalex.org/W2963905288","https://openalex.org/W2964027659","https://openalex.org/W2964444661","https://openalex.org/W2969875432","https://openalex.org/W2982509564","https://openalex.org/W2984009799","https://openalex.org/W2987131085","https://openalex.org/W2988452521","https://openalex.org/W2989294831","https://openalex.org/W2989604896","https://openalex.org/W2989753085","https://openalex.org/W2990130718","https://openalex.org/W2993592664","https://openalex.org/W3000346474","https://openalex.org/W3015352266","https://openalex.org/W3015777237","https://openalex.org/W3016916515","https://openalex.org/W3033116542","https://openalex.org/W3034307881","https://openalex.org/W3034896527","https://openalex.org/W3034955056","https://openalex.org/W3035376925","https://openalex.org/W3035694605","https://openalex.org/W3084389333","https://openalex.org/W3092873533","https://openalex.org/W3099389178","https://openalex.org/W3104732503","https://openalex.org/W3110525903","https://openalex.org/W3110686003","https://openalex.org/W3116967329","https://openalex.org/W6620707391","https://openalex.org/W6637373629","https://openalex.org/W6676855097","https://openalex.org/W6739651123","https://openalex.org/W6753836424","https://openalex.org/W6761586423","https://openalex.org/W6763087592"],"related_works":["https://openalex.org/W4318664220","https://openalex.org/W2771047279","https://openalex.org/W4388409104","https://openalex.org/W2965546495","https://openalex.org/W1544811710","https://openalex.org/W3132270449","https://openalex.org/W4377289091","https://openalex.org/W3013647784","https://openalex.org/W2997281059","https://openalex.org/W2349354464"],"abstract_inverted_index":{"Multispectral":[0],"pedestrian":[1,30,76],"detection":[2,77],"has":[3],"received":[4],"great":[5],"attention":[6],"in":[7,28],"recent":[8],"years":[9],"as":[10],"multispectral":[11,29,75,226],"modalities":[12,38,216],"(i.e.":[13],"color":[14],"and":[15,94,239],"thermal)":[16],"can":[17,205],"provide":[18],"complementary":[19],"visual":[20],"information.":[21],"However,":[22],"there":[23],"are":[24,47,58],"major":[25],"inherent":[26],"issues":[27],"detection.":[31],"First,":[32],"the":[33,36,99,108,111,115,132,150,154,159,166,169,175,178,182,224,234,237,241],"cameras":[34],"of":[35,86,90,110,134,168,185,195,214,236],"two":[37,84,120,215],"have":[39],"different":[40,61],"field-of-views":[41],"(FoVs),":[42],"so":[43],"that":[44,194,230],"image":[45,56],"pairs":[46,57],"often":[48],"miscalibrated.":[49],"Second,":[50],"modality":[51,151,191,242],"discrepancy":[52],"is":[53],"observed,":[54],"because":[55],"captured":[59],"at":[60],"wavelengths.":[62],"In":[63,79,153],"this":[64],"paper,":[65],"to":[66,130,192,217],"alleviate":[67],"these":[68],"issues,":[69],"we":[70,82,102,123,157,228],"propose":[71,103,143],"a":[72],"new":[73],"uncertainty-aware":[74,125,144],"framework.":[78],"our":[80,231],"framework,":[81],"consider":[83],"types":[85],"uncertainties:":[87],"1)":[88],"Region":[89],"Interest":[91],"(RoI)":[92],"uncertainty":[93,105],"2)":[95],"predictive":[96,160,176,187,197],"uncertainty.":[97,140],"For":[98],"miscalibration":[100,238],"issue,":[101],"RoI":[104,112,116,135,139,170],"which":[106,162],"represents":[107],"reliability":[109],"candidates.":[113],"With":[114,220],"uncertainty,":[117,161,177],"when":[118],"combining":[119],"modal":[121],"features,":[122],"devise":[124],"feature":[126,171,183,212],"fusion":[127],"(UFF)":[128],"module":[129,148,180,204],"reduce":[131],"effect":[133,235],"features":[136,209],"with":[137],"high":[138,186],"We":[141],"also":[142],"cross-modal":[145],"guiding":[146,211],"(UCG)":[147],"for":[149],"discrepancy.":[152],"UCG":[155,179,203],"module,":[156],"use":[158],"indicates":[163],"how":[164],"reliable":[165],"prediction":[167],"is.":[172],"Based":[173],"on":[174,223],"guides":[181],"distribution":[184],"uncertain":[188,198],"(less":[189],"reliable)":[190,200],"resemble":[193],"low":[196],"(more":[199],"modality.":[201],"The":[202],"encode":[206],"more":[207],"discriminative":[208],"by":[210],"distributions":[213],"be":[218],"similar.":[219],"comprehensive":[221],"experiments":[222],"public":[225],"datasets,":[227],"verified":[229],"method":[232],"reduces":[233],"alleviates":[240],"discrepancy,":[243],"outperforming":[244],"existing":[245],"state-of-the-art":[246],"methods.":[247]},"counts_by_year":[{"year":2026,"cited_by_count":8},{"year":2025,"cited_by_count":30},{"year":2024,"cited_by_count":33},{"year":2023,"cited_by_count":34},{"year":2022,"cited_by_count":11},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
