{"id":"https://openalex.org/W4415537699","doi":"https://doi.org/10.1145/3746027.3754863","title":"LEAF-Mamba: Local Emphatic and Adaptive Fusion State Space Model for RGB-D Salient Object Detection","display_name":"LEAF-Mamba: Local Emphatic and Adaptive Fusion State Space Model for RGB-D Salient Object Detection","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415537699","doi":"https://doi.org/10.1145/3746027.3754863"},"language":"en","primary_location":{"id":"doi:10.1145/3746027.3754863","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746027.3754863","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3746027.3754863","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114231023","display_name":"Lanhu Wu","orcid":"https://orcid.org/0009-0006-6420-5971"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lanhu Wu","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010623154","display_name":"Zilin Gao","orcid":"https://orcid.org/0000-0003-1757-9349"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zilin Gao","raw_affiliation_strings":["Dalian University of Technology, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hao Fei","orcid":"https://orcid.org/0000-0003-3026-6347"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Hao Fei","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019988958","display_name":"Mong Li Lee","orcid":"https://orcid.org/0000-0002-9636-388X"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Mong-Li Lee","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051209739","display_name":"Wynne Hsu","orcid":"https://orcid.org/0000-0002-4142-8893"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Wynne Hsu","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5114231023"],"corresponding_institution_ids":["https://openalex.org/I27357992"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3045719,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1013","last_page":"1022"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.6089000105857849},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5314000248908997},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.44780001044273376},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4372999966144562},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.43369999527931213},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4226999878883362},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.41280001401901245},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.3506999909877777}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6326000094413757},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.619700014591217},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.6089000105857849},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5314000248908997},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.44780001044273376},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4375},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4372999966144562},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.43369999527931213},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4226999878883362},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.41280001401901245},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.3506999909877777},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.34529998898506165},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3407999873161316},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.33739998936653137},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.33719998598098755},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3359000086784363},{"id":"https://openalex.org/C2780695315","wikidata":"https://www.wikidata.org/wiki/Q3799040","display_name":"Unobservable","level":2,"score":0.3287999927997589},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.32600000500679016},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.3111000061035156},{"id":"https://openalex.org/C157202957","wikidata":"https://www.wikidata.org/wiki/Q1659609","display_name":"Image warping","level":2,"score":0.3091999888420105},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3086000084877014},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2782999873161316},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27140000462532043},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2590999901294708}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3746027.3754863","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746027.3754863","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2509.18683","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.18683","pdf_url":"https://arxiv.org/pdf/2509.18683","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3746027.3754863","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746027.3754863","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W2565639579","https://openalex.org/W2945809413","https://openalex.org/W2957414648","https://openalex.org/W2998449272","https://openalex.org/W3003376220","https://openalex.org/W3114848016","https://openalex.org/W3166092877","https://openalex.org/W4206420686","https://openalex.org/W4214831601","https://openalex.org/W4285163934","https://openalex.org/W4292896077","https://openalex.org/W4307771365","https://openalex.org/W4312612915","https://openalex.org/W4315606099","https://openalex.org/W4319866558","https://openalex.org/W4319879007","https://openalex.org/W4376467320","https://openalex.org/W4386902928","https://openalex.org/W4391791419","https://openalex.org/W4391827269","https://openalex.org/W4392346283","https://openalex.org/W4392824656","https://openalex.org/W4395470960","https://openalex.org/W4399207208","https://openalex.org/W4401557909","https://openalex.org/W4413146378"],"related_works":[],"abstract_inverted_index":{"RGB-D":[0,75,152],"salient":[1],"object":[2],"detection":[3],"(SOD)":[4],"aims":[5],"to":[6,74,79,119],"identify":[7],"the":[8,16,29,39,86,146,168],"most":[9],"conspicuous":[10],"objects":[11],"in":[12,47,155],"a":[13,45,96,112,173],"scene":[14],"with":[15,67],"incorporation":[17],"of":[18,41],"depth":[19],"cues.":[20],"Existing":[21],"methods":[22,154],"mainly":[23],"rely":[24],"on":[25,167],"CNNs,":[26],"limited":[27],"by":[28],"local":[30,81,113,122],"receptive":[31],"fields,":[32],"or":[33],"Vision":[34],"Transformers":[35],"that":[36,106,145],"suffer":[37],"from":[38],"cost":[40],"quadratic":[42],"complexity,":[43],"posing":[44],"challenge":[46],"balancing":[48],"performance":[49,166],"and":[50,99,138,158],"computational":[51],"efficiency.":[52,159],"Recently,":[53],"state":[54,102,115],"space":[55,103,116],"models":[56],"(SSM),":[57],"Mamba,":[58],"have":[59],"shown":[60],"great":[61],"potential":[62],"for":[63,124,134],"modeling":[64],"long-range":[65],"dependency":[66],"linear":[68],"complexity.":[69],"However,":[70],"directly":[71],"applying":[72],"SSM":[73],"SOD":[76,153,170],"may":[77],"lead":[78],"deficient":[80],"semantics":[82],"as":[83,85],"well":[84],"inadequate":[87],"cross-modality":[88,136,140],"fusion.":[89],"To":[90],"address":[91],"these":[92],"issues,":[93],"we":[94],"propose":[95],"Local":[97],"Emphatic":[98],"Adaptive":[100],"Fusion":[101],"model":[104],"(LEAF-Mamba)":[105],"contains":[107],"two":[108],"novel":[109],"components:":[110],"1)":[111],"emphatic":[114],"module":[117,132],"(LE-SSM)":[118],"capture":[120],"multi-scale":[121],"dependencies":[123],"both":[125,156],"modalities.":[126],"2)":[127],"an":[128],"SSM-based":[129],"adaptive":[130],"fusion":[131],"(AFM)":[133],"complementary":[135],"interaction":[137],"reliable":[139],"integration.":[141],"Extensive":[142],"experiments":[143],"demonstrate":[144],"LEAF-Mamba":[147],"consistently":[148],"outperforms":[149],"16":[150],"state-of-the-art":[151],"efficacy":[157],"Moreover,":[160],"our":[161],"method":[162],"can":[163],"achieve":[164],"excellent":[165],"RGB-T":[169],"task,":[171],"proving":[172],"powerful":[174],"generalization":[175],"ability.":[176],"Our":[177],"code":[178],"is":[179],"publicly":[180],"available":[181],"at":[182],"https://github.com/LanhooNg/LEAF-Mamba.":[183]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-25T00:00:00"}
