{"id":"https://openalex.org/W4308234205","doi":"https://doi.org/10.1109/icip46576.2022.9897410","title":"Multi-Modality Diversity Fusion Network with Swintransformer for RGB-D Salient Object Detection","display_name":"Multi-Modality Diversity Fusion Network with Swintransformer for RGB-D Salient Object Detection","publication_year":2022,"publication_date":"2022-10-16","ids":{"openalex":"https://openalex.org/W4308234205","doi":"https://doi.org/10.1109/icip46576.2022.9897410"},"language":"en","primary_location":{"id":"doi:10.1109/icip46576.2022.9897410","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip46576.2022.9897410","pdf_url":null,"source":{"id":"https://openalex.org/S4363607719","display_name":"2022 IEEE International Conference on Image Processing (ICIP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067515645","display_name":"Songsong Duan","orcid":"https://orcid.org/0000-0003-2983-4044"},"institutions":[{"id":"https://openalex.org/I184681353","display_name":"Anhui University of Science and Technology","ror":"https://ror.org/00q9atg80","country_code":"CN","type":"education","lineage":["https://openalex.org/I184681353"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Songsong Duan","raw_affiliation_strings":["Anhui University of Science and Technology,College of Computer Science and Engineering,China","College of Computer Science and Engineering, Anhui University of Science and Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Anhui University of Science and Technology,College of Computer Science and Engineering,China","institution_ids":["https://openalex.org/I184681353"]},{"raw_affiliation_string":"College of Computer Science and Engineering, Anhui University of Science and Technology, China","institution_ids":["https://openalex.org/I184681353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103259110","display_name":"Chenxing Xia","orcid":"https://orcid.org/0009-0007-8138-9204"},"institutions":[{"id":"https://openalex.org/I184681353","display_name":"Anhui University of Science and Technology","ror":"https://ror.org/00q9atg80","country_code":"CN","type":"education","lineage":["https://openalex.org/I184681353"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenxing Xia","raw_affiliation_strings":["Anhui University of Science and Technology,College of Computer Science and Engineering,China","College of Computer Science and Engineering, Anhui University of Science and Technology, China","Hefei Comprehensive National Science Center, Institute of Energy, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Anhui University of Science and Technology,College of Computer Science and Engineering,China","institution_ids":["https://openalex.org/I184681353"]},{"raw_affiliation_string":"College of Computer Science and Engineering, Anhui University of Science and Technology, China","institution_ids":["https://openalex.org/I184681353"]},{"raw_affiliation_string":"Hefei Comprehensive National Science Center, Institute of Energy, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068221881","display_name":"Xiuju Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I184681353","display_name":"Anhui University of Science and Technology","ror":"https://ror.org/00q9atg80","country_code":"CN","type":"education","lineage":["https://openalex.org/I184681353"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiuju Gao","raw_affiliation_strings":["Anhui University of Science and Technology,College of Computer Science and Engineering,China","College of Computer Science and Engineering, Anhui University of Science and Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Anhui University of Science and Technology,College of Computer Science and Engineering,China","institution_ids":["https://openalex.org/I184681353"]},{"raw_affiliation_string":"College of Computer Science and Engineering, Anhui University of Science and Technology, China","institution_ids":["https://openalex.org/I184681353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033351506","display_name":"Bin Ge","orcid":"https://orcid.org/0000-0001-9050-1105"},"institutions":[{"id":"https://openalex.org/I184681353","display_name":"Anhui University of Science and Technology","ror":"https://ror.org/00q9atg80","country_code":"CN","type":"education","lineage":["https://openalex.org/I184681353"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Ge","raw_affiliation_strings":["Anhui University of Science and Technology,College of Computer Science and Engineering,China","College of Computer Science and Engineering, Anhui University of Science and Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Anhui University of Science and Technology,College of Computer Science and Engineering,China","institution_ids":["https://openalex.org/I184681353"]},{"raw_affiliation_string":"College of Computer Science and Engineering, Anhui University of Science and Technology, China","institution_ids":["https://openalex.org/I184681353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039718270","display_name":"Hanling Zhang","orcid":"https://orcid.org/0000-0002-8242-9139"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanling Zhang","raw_affiliation_strings":["Hunan University,School of Design,China","School of Design, Hunan University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hunan University,School of Design,China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"School of Design, Hunan University, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063188437","display_name":"Kuan\u2010Ching Li","orcid":"https://orcid.org/0000-0003-1381-4364"},"institutions":[{"id":"https://openalex.org/I177918364","display_name":"Providence University","ror":"https://ror.org/03fcpsq87","country_code":"TW","type":"education","lineage":["https://openalex.org/I177918364"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Kuan-Ching Li","raw_affiliation_strings":["Providence University,Department of Computer Science and Information Engineering,Taiwan","Department of Computer Science and Information Engineering, Providence University, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Providence University,Department of Computer Science and Information Engineering,Taiwan","institution_ids":["https://openalex.org/I177918364"]},{"raw_affiliation_string":"Department of Computer Science and Information Engineering, Providence University, Taiwan","institution_ids":["https://openalex.org/I177918364"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2359,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.58493647,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1076","last_page":"1080"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.7295902967453003},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6452764272689819},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.615339994430542},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6083564162254333},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5463292598724365},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4738769233226776},{"id":"https://openalex.org/keywords/subnet","display_name":"Subnet","score":0.4223592281341553},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.41368740797042847},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33931219577789307},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.33067166805267334},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.32050013542175293}],"concepts":[{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.7295902967453003},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6452764272689819},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.615339994430542},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6083564162254333},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5463292598724365},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4738769233226776},{"id":"https://openalex.org/C21099817","wikidata":"https://www.wikidata.org/wiki/Q7631721","display_name":"Subnet","level":2,"score":0.4223592281341553},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.41368740797042847},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33931219577789307},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33067166805267334},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32050013542175293},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip46576.2022.9897410","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip46576.2022.9897410","pdf_url":null,"source":{"id":"https://openalex.org/S4363607719","display_name":"2022 IEEE International Conference on Image Processing (ICIP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.44999998807907104}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2071549734","https://openalex.org/W2953950151","https://openalex.org/W2957414648","https://openalex.org/W3010616503","https://openalex.org/W3022015146","https://openalex.org/W3035284915","https://openalex.org/W3035357085","https://openalex.org/W3035633116","https://openalex.org/W3035687312","https://openalex.org/W3106587394","https://openalex.org/W3108421143","https://openalex.org/W3108822985","https://openalex.org/W3114152269","https://openalex.org/W3120113457","https://openalex.org/W3135874576","https://openalex.org/W3138516171","https://openalex.org/W3163411367","https://openalex.org/W3173882198","https://openalex.org/W3177040887","https://openalex.org/W3206198586","https://openalex.org/W3207804100","https://openalex.org/W3211246039"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4224266612","https://openalex.org/W2383394264","https://openalex.org/W4320153225","https://openalex.org/W4293261942","https://openalex.org/W3125968744","https://openalex.org/W2167701463","https://openalex.org/W2110287964","https://openalex.org/W4307407935","https://openalex.org/W649759291"],"abstract_inverted_index":{"Multi-modality":[0],"complementary":[1],"information":[2,34,126],"brings":[3],"new":[4],"impetus":[5],"and":[6,24,86,97,123],"innovation":[7],"to":[8,105,119,129],"saliency":[9],"object":[10],"detection":[11],"(SOD).":[12],"However,":[13],"most":[14],"existing":[15],"RGB-D":[16,68,158],"SOD":[17,46,69,159],"methods":[18],"either":[19],"indiscriminately":[20],"handle":[21],"RGB":[22,36,85],"features":[23,26,31,122],"depth":[25,30,87],"or":[27],"only":[28],"take":[29],"as":[32],"additional":[33],"of":[35,42,73,77,84,109,136],"subnet-work,":[37],"ignoring":[38],"the":[39,71,74,82,107,134,146],"different":[40,75,110],"roles":[41,83],"two":[43],"modalities":[44],"for":[45,67],"tasks.":[47],"To":[48,89],"tackle":[49],"this":[50,90],"issue,":[51],"we":[52,113],"propose":[53],"a":[54,92,98,115],"novel":[55],"multi-modality":[56],"diversity":[57,99],"fusion":[58,100],"network":[59],"with":[60],"SwinTransformer":[61],"(M":[62],"<sup":[63,149],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[64,150],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sup>":[65,151],"DFNet)":[66],"from":[70,127],"perspective":[72],"status":[76],"multi-modality,":[78],"which":[79,131],"adequately":[80],"explores":[81],"modalities.":[88,111],"end,":[91],"triple-diversity":[93],"supervision":[94],"mechanism":[95],"(TDSM)":[96],"module":[101],"(DFM)":[102],"are":[103],"designed":[104,114],"parse":[106],"function":[108],"Besides,":[112],"dense":[116],"decoder":[117],"(DSD)":[118],"integrate":[120],"multi-scale":[121],"transfer":[124],"gain":[125],"top":[128],"bottom,":[130],"can":[132],"improve":[133],"performance":[135],"SOD.":[137],"Extensive":[138],"experiments":[139],"on":[140],"five":[141],"benchmark":[142],"datasets":[143],"demonstrate":[144],"that":[145],"proposed":[147],"M":[148],"DFNet":[152],"outperforms":[153],"17":[154],"other":[155],"state-of-the-art":[156],"(SOTA)":[157],"methods.":[160]},"counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
