{"id":"https://openalex.org/W4416251586","doi":"https://doi.org/10.1109/ijcnn64981.2025.11228068","title":"HEFNet: Hierarchical Unimodal Enhancement and Multi-modal Fusion for RGB-T Salient Object Detection","display_name":"HEFNet: Hierarchical Unimodal Enhancement and Multi-modal Fusion for RGB-T Salient Object Detection","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4416251586","doi":"https://doi.org/10.1109/ijcnn64981.2025.11228068"},"language":null,"primary_location":{"id":"doi:10.1109/ijcnn64981.2025.11228068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11228068","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065342667","display_name":"Jiayun Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I67001856","display_name":"Shanghai Institute of Technology","ror":"https://ror.org/00fjzqj15","country_code":"CN","type":"education","lineage":["https://openalex.org/I67001856"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiayun Wu","raw_affiliation_strings":["Shanghai Institute of Technology,Faculty of Intelligence Technology,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Institute of Technology,Faculty of Intelligence Technology,China","institution_ids":["https://openalex.org/I67001856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022170736","display_name":"Qing Zhang","orcid":"https://orcid.org/0000-0002-8846-5587"},"institutions":[{"id":"https://openalex.org/I67001856","display_name":"Shanghai Institute of Technology","ror":"https://ror.org/00fjzqj15","country_code":"CN","type":"education","lineage":["https://openalex.org/I67001856"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing Zhang","raw_affiliation_strings":["Shanghai Institute of Technology,Faculty of Intelligence Technology,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Institute of Technology,Faculty of Intelligence Technology,China","institution_ids":["https://openalex.org/I67001856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100361488","display_name":"Chenxi Zhang","orcid":"https://orcid.org/0000-0002-5736-9285"},"institutions":[{"id":"https://openalex.org/I67001856","display_name":"Shanghai Institute of Technology","ror":"https://ror.org/00fjzqj15","country_code":"CN","type":"education","lineage":["https://openalex.org/I67001856"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenxi Zhang","raw_affiliation_strings":["Shanghai Institute of Technology,Faculty of Intelligence Technology,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Institute of Technology,Faculty of Intelligence Technology,China","institution_ids":["https://openalex.org/I67001856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013600952","display_name":"Yanjiao Shi","orcid":"https://orcid.org/0000-0001-9689-4165"},"institutions":[{"id":"https://openalex.org/I67001856","display_name":"Shanghai Institute of Technology","ror":"https://ror.org/00fjzqj15","country_code":"CN","type":"education","lineage":["https://openalex.org/I67001856"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanjiao Shi","raw_affiliation_strings":["Shanghai Institute of Technology,Faculty of Intelligence Technology,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Institute of Technology,Faculty of Intelligence Technology,China","institution_ids":["https://openalex.org/I67001856"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110493142","display_name":"Qiangqiang Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I53592917","display_name":"Jiangxi Normal University","ror":"https://ror.org/05nkgk822","country_code":"CN","type":"education","lineage":["https://openalex.org/I53592917"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiangqiang Zhou","raw_affiliation_strings":["Jiangxi Normal University,School of Software,Nanchang,China"],"affiliations":[{"raw_affiliation_string":"Jiangxi Normal University,School of Software,Nanchang,China","institution_ids":["https://openalex.org/I53592917"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5065342667"],"corresponding_institution_ids":["https://openalex.org/I67001856"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3451722,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.005900000222027302,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.00019999999494757503,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7389000058174133},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6697999835014343},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6240000128746033},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.5562999844551086},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.54830002784729},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5259000062942505},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.43689998984336853},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4284999966621399},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.41100001335144043}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7748000025749207},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7423999905586243},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7389000058174133},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6697999835014343},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6240000128746033},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.5562999844551086},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.54830002784729},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5259000062942505},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.49459999799728394},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.43689998984336853},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4284999966621399},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.41100001335144043},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.36910000443458557},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3686999976634979},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.35420000553131104},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.35420000553131104},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3513000011444092},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.32019999623298645},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2881999909877777},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.2615000009536743},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.257999986410141},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.25780001282691956}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn64981.2025.11228068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11228068","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1994922096","https://openalex.org/W2151049637","https://openalex.org/W2160613239","https://openalex.org/W2780861787","https://openalex.org/W2887486131","https://openalex.org/W2921749009","https://openalex.org/W2938260698","https://openalex.org/W2939217524","https://openalex.org/W2945809413","https://openalex.org/W2963529609","https://openalex.org/W2963691377","https://openalex.org/W2963868681","https://openalex.org/W3039479109","https://openalex.org/W3047800102","https://openalex.org/W3138516171","https://openalex.org/W3164802490","https://openalex.org/W3173370190","https://openalex.org/W3177052299","https://openalex.org/W3185043317","https://openalex.org/W3212645988","https://openalex.org/W4285161446","https://openalex.org/W4289752563","https://openalex.org/W4295165408","https://openalex.org/W4312699294","https://openalex.org/W4313270788","https://openalex.org/W4315606099","https://openalex.org/W4319459168","https://openalex.org/W4319879007","https://openalex.org/W4386158864","https://openalex.org/W4387747474","https://openalex.org/W4387969358","https://openalex.org/W4389160548","https://openalex.org/W4392152057","https://openalex.org/W4392824656","https://openalex.org/W4405056285"],"related_works":[],"abstract_inverted_index":{"RGB-Thermal":[0],"salient":[1],"object":[2],"detection":[3],"(RGB-T":[4],"SOD)":[5],"aims":[6],"to":[7,38,57,84,127,171,177],"identify":[8],"and":[9,20,32,51,59,81,100,114,137,143,194],"segment":[10],"visually":[11],"prominent":[12],"objects":[13],"by":[14,103],"leveraging":[15],"complementary":[16,105],"information":[17,106],"from":[18,107],"RGB":[19,99],"thermal":[21,101],"modalities.":[22],"A":[23],"key":[24],"challenge":[25],"lies":[26],"in":[27],"exploiting":[28],"both":[29],"the":[30,46,52,91,119,141,150,156,163],"uniqueness":[31],"shared":[33],"characteristics":[34],"of":[35,48,152,158],"these":[36,66],"modalities":[37],"enhance":[39],"their":[40],"collaboration.":[41],"Existing":[42],"methods":[43],"often":[44],"ignore":[45],"optimization":[47],"unimodal":[49,79,92],"features":[50,102,174],"level-specific":[53],"modality":[54],"discrepancy,":[55],"leading":[56],"noisy":[58],"redundant":[60],"multi-modal":[61,82,121],"feature":[62,93,131,165],"representations.":[63],"To":[64],"address":[65],"limitations,":[67],"we":[68,89],"propose":[69],"a":[70],"novel":[71],"RGB-T":[72,198],"SOD":[73,199],"network,":[74],"HEFNet,":[75],"which":[76,97],"employs":[77],"hierarchical":[78,120],"enhancement":[80,94],"fusion":[83,122,138],"achieve":[85],"precise":[86],"segmentation.":[87],"Specifically,":[88],"introduce":[90],"(UFE)":[95],"module,":[96],"refines":[98],"incorporating":[104],"adjacent":[108],"levels,":[109],"thereby":[110],"enhancing":[111],"saliency":[112,180],"cues":[113],"suppressing":[115],"noise":[116],"distractions.":[117],"Additionally,":[118],"(HMF)":[123],"module":[124,168],"is":[125,169],"designed":[126],"generate":[128],"robust":[129],"cross-modal":[130,160],"representation.":[132],"By":[133],"employing":[134],"tailored":[135],"refinement":[136],"strategies":[139],"within":[140],"UFE":[142],"HMF":[144],"modules,":[145],"our":[146,186],"network":[147],"fully":[148],"exploits":[149],"strengths":[151],"each":[153],"modality,":[154],"facilitating":[155],"generation":[157],"discriminative":[159],"features.":[161],"Finally,":[162],"multi-level":[164],"integration":[166],"(MFI)":[167],"introduced":[170],"progressively":[172],"aggregate":[173],"across":[175],"levels":[176],"ensure":[178],"accurate":[179],"predictions.":[181],"Extensive":[182],"experiments":[183],"demonstrate":[184],"that":[185],"method":[187],"achieves":[188],"state-of-the-art":[189],"performance,":[190],"verifying":[191],"its":[192],"effectiveness":[193],"superiority":[195],"over":[196],"existing":[197],"approaches.":[200],"Our":[201],"results":[202],"are":[203],"available":[204],"at":[205],"https://github.com/ZhangQing0329/HEFNet":[206]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-11-14T00:00:00"}
