{"id":"https://openalex.org/W4408355364","doi":"https://doi.org/10.1109/icassp49660.2025.10888019","title":"Easy-to-hard Instance-level Feature Fusion for Co-saliency Detection","display_name":"Easy-to-hard Instance-level Feature Fusion for Co-saliency Detection","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408355364","doi":"https://doi.org/10.1109/icassp49660.2025.10888019"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10888019","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10888019","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113730802","display_name":"Chuang Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chuang Ding","raw_affiliation_strings":["NUIST"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NUIST","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100450850","display_name":"Zhidong Han","orcid":"https://orcid.org/0000-0002-4990-2211"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhidong Han","raw_affiliation_strings":["NUIST"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NUIST","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019485232","display_name":"Gang Dong","orcid":"https://orcid.org/0000-0002-9515-6643"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gang Dong","raw_affiliation_strings":["IEIT SYSTEMS Co., Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IEIT SYSTEMS Co., Ltd","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112801316","display_name":"Lingyan Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lingyan Liang","raw_affiliation_strings":["IEIT SYSTEMS Co., Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IEIT SYSTEMS Co., Ltd","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013433372","display_name":"Dongchao Wen","orcid":"https://orcid.org/0000-0001-7311-1842"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dongchao Wen","raw_affiliation_strings":["IEIT SYSTEMS Co., Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IEIT SYSTEMS Co., Ltd","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075412755","display_name":"Kaihua Zhang","orcid":"https://orcid.org/0000-0002-1613-3401"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kaihua Zhang","raw_affiliation_strings":["IEIT SYSTEMS Co., Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IEIT SYSTEMS Co., Ltd","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03043766,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7121633291244507},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6010260581970215},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5526769161224365},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5496011972427368},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4875916838645935}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7121633291244507},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6010260581970215},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5526769161224365},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5496011972427368},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4875916838645935},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10888019","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10888019","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4300000071525574,"id":"https://metadata.un.org/sdg/13","display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1522973599","https://openalex.org/W1891496504","https://openalex.org/W2044465660","https://openalex.org/W2100470808","https://openalex.org/W2165612380","https://openalex.org/W2342491128","https://openalex.org/W2504335775","https://openalex.org/W2904945062","https://openalex.org/W2963529609","https://openalex.org/W2963868681","https://openalex.org/W2971889950","https://openalex.org/W3023562424","https://openalex.org/W3034499925","https://openalex.org/W3035666869","https://openalex.org/W3039991645","https://openalex.org/W3096289386","https://openalex.org/W3173349970","https://openalex.org/W3202242435","https://openalex.org/W4221145551","https://openalex.org/W4291653109","https://openalex.org/W4362654014","https://openalex.org/W4386065895","https://openalex.org/W4386076585","https://openalex.org/W4386159059","https://openalex.org/W4392152057","https://openalex.org/W4402981691","https://openalex.org/W6698333214","https://openalex.org/W6793183881","https://openalex.org/W6847957277"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2033914206","https://openalex.org/W2042327336"],"abstract_inverted_index":{"Existing":[0],"leading":[1,69],"deep":[2],"learning-based":[3],"Co-saliency":[4],"Detection":[5],"(CoD)":[6],"methods":[7],"often":[8],"learn":[9,174],"the":[10,14,20,26,29,51,59,93,100,109,114,139,143,161,166,170,175,183,187,204,208,216,221,226,229,235,246],"consensus":[11,97,179,184,205],"features":[12,112,206,218,231],"from":[13,99,165,186,207],"input":[15,30],"image":[16,127],"group":[17],"without":[18],"considering":[19],"complexity":[21,128],"of":[22],"each":[23],"image.":[24],"Despite":[25],"demonstrated":[27],"success,":[28],"images":[31],"may":[32],"contain":[33],"hard":[34,115,209],"samples":[35,102,145,168,189,210],"with":[36,146,182,203],"high":[37],"complexity,":[38],"e.g.,":[39],"those":[40],"containing":[41],"distractors":[42,65],"that":[43,125,219,245],"have":[44],"similar":[45],"appearance":[46],"but":[47],"different":[48],"semantics":[49],"to":[50,57,62,70,106,141,173],"co-salient":[52,67,95,110,162,177,222],"objects.":[53],"This":[54],"is":[55],"prone":[56],"mislead":[58],"learned":[60],"model":[61,140],"treat":[63],"these":[64],"as":[66,103,169,190],"objects,":[68],"classification":[71],"ambiguity.":[72],"To":[73],"address":[74],"this":[75,77],"issue,":[76],"paper":[78],"presents":[79],"an":[80,153,194],"easy-to-hard":[81],"instance-level":[82,94,171],"feature":[83],"Fusion":[84,197],"framework":[85],"for":[86],"CoD,":[87],"termed":[88],"E2HCoD.":[89],"The":[90],"E2HCoD":[91,248],"exploits":[92],"object":[96,111,163,178],"cues":[98],"easy":[101,144,148,167,188],"reliable":[104],"guidance":[105,172],"accurately":[107,159],"fuse":[108],"in":[113],"samples.":[116],"First,":[117],"we":[118,151,192],"design":[119],"a":[120,212,238],"Feature":[121],"Filtering":[122],"Module":[123],"(FFM)":[124],"evaluates":[126],"by":[129],"integrating":[130],"entropy,":[131],"variance,":[132],"texture,":[133],"and":[134,255],"edge":[135],"density":[136],"cues,":[137],"allowing":[138],"select":[142],"relatively":[147],"backgrounds.":[149],"Then,":[150,181],"develop":[152],"Easy-instance":[154,195],"Embedding":[155],"Branch":[156,198],"(EEB),":[157],"which":[158,200],"segments":[160],"masks":[164],"accurate":[176],"cues.":[180],"knowledge":[185],"guidance,":[191],"construct":[193],"guided":[196],"(EFB),":[199],"fully":[201],"interacts":[202],"via":[211],"cross-attention":[213],"mechanism,":[214],"yielding":[215],"refined":[217,230],"highlight":[220],"objects":[223],"while":[224],"suppressing":[225],"distractors.":[227],"Finally,":[228],"are":[232],"fed":[233],"into":[234],"decoder,":[236],"generating":[237],"high-quality":[239],"CoD":[240],"prediction.":[241],"Extensive":[242],"experiments":[243],"demonstrate":[244],"proposed":[247],"achieves":[249],"state-of-the-art":[250],"performance":[251],"on":[252],"CoSal2015,":[253],"CoCA,":[254],"CoSOD3k.":[256]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
