{"id":"https://openalex.org/W7124439889","doi":"https://doi.org/10.1109/tip.2026.3651951","title":"Boosting Segment Anything Model to Generalize Visually Non-Salient Scenarios","display_name":"Boosting Segment Anything Model to Generalize Visually Non-Salient Scenarios","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7124439889","doi":"https://doi.org/10.1109/tip.2026.3651951","pmid":"https://pubmed.ncbi.nlm.nih.gov/41538350"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2026.3651951","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2026.3651951","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002446197","display_name":"Guangqian Guo","orcid":"https://orcid.org/0000-0002-8940-1382"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guangqian Guo","raw_affiliation_strings":["Unmanned System Research Institute, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-8940-1382","affiliations":[{"raw_affiliation_string":"Unmanned System Research Institute, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Pengfei Chen","orcid":"https://orcid.org/0000-0003-4883-201X"},"institutions":[{"id":"https://openalex.org/I17747738","display_name":"Beijing University of Chinese Medicine","ror":"https://ror.org/05damtm70","country_code":"CN","type":"education","lineage":["https://openalex.org/I17747738"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengfei Chen","raw_affiliation_strings":["School of Electronic, Electrical, and Communication Engineering, University of Chinese Academic of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4883-201X","affiliations":[{"raw_affiliation_string":"School of Electronic, Electrical, and Communication Engineering, University of Chinese Academic of Sciences, Beijing, China","institution_ids":["https://openalex.org/I17747738"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123181668","display_name":"Yong Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210109712","display_name":"Max Planck Institute for Informatics","ror":"https://ror.org/01w19ak89","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210109712"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Yong Guo","raw_affiliation_strings":["Max Planck Institute for Informatics (MPI-INF), Saarbr&#x00FC;cken, Germany"],"raw_orcid":"https://orcid.org/0000-0002-3444-4588","affiliations":[{"raw_affiliation_string":"Max Planck Institute for Informatics (MPI-INF), Saarbr&#x00FC;cken, Germany","institution_ids":["https://openalex.org/I4210109712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018905757","display_name":"Huafeng Chen","orcid":"https://orcid.org/0000-0001-8371-0216"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huafeng Chen","raw_affiliation_strings":["Unmanned System Research Institute, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0001-8371-0216","affiliations":[{"raw_affiliation_string":"Unmanned System Research Institute, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122284882","display_name":"Boqiang Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Boqiang Zhang","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":null,"display_name":"Shan Gao","orcid":"https://orcid.org/0000-0002-3427-5825"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shan Gao","raw_affiliation_strings":["Unmanned System Research Institute, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-3427-5825","affiliations":[{"raw_affiliation_string":"Unmanned System Research Institute, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5002446197"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.09272071,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"35","issue":null,"first_page":"1143","last_page":"1157"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.005499999970197678,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.0005000000237487257,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.744700014591217},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7314000129699707},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.548799991607666},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5329999923706055},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.482699990272522},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4699000120162964},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40290001034736633},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3995000123977661}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7925999760627747},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.744700014591217},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7314000129699707},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6656000018119812},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.548799991607666},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5329999923706055},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.482699990272522},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4699000120162964},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42800000309944153},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40290001034736633},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3995000123977661},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.37299999594688416},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.3562999963760376},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34599998593330383},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3149000108242035},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.31380000710487366},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.3018999993801117},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C97256817","wikidata":"https://www.wikidata.org/wiki/Q1462316","display_name":"Spurious relationship","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2854999899864197},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2791999876499176},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.27720001339912415},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.250900000333786}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2026.3651951","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2026.3651951","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:41538350","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41538350","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3618867521","display_name":null,"funder_award_id":"62372382","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1994922096","https://openalex.org/W2008359794","https://openalex.org/W2021088830","https://openalex.org/W2044465660","https://openalex.org/W2101946599","https://openalex.org/W2128262343","https://openalex.org/W2150587757","https://openalex.org/W2285968993","https://openalex.org/W2933794321","https://openalex.org/W2943545929","https://openalex.org/W2961348656","https://openalex.org/W2962793481","https://openalex.org/W2963529609","https://openalex.org/W2965729941","https://openalex.org/W2989684653","https://openalex.org/W2990984982","https://openalex.org/W2993182889","https://openalex.org/W2997286550","https://openalex.org/W2998249728","https://openalex.org/W2998449272","https://openalex.org/W2999219213","https://openalex.org/W3023282579","https://openalex.org/W3034552520","https://openalex.org/W3034684132","https://openalex.org/W3109733326","https://openalex.org/W3119387259","https://openalex.org/W3164098653","https://openalex.org/W3170019900","https://openalex.org/W3171516518","https://openalex.org/W3176152216","https://openalex.org/W3198494235","https://openalex.org/W4285601297","https://openalex.org/W4299652825","https://openalex.org/W4312964941","https://openalex.org/W4313023779","https://openalex.org/W4313590837","https://openalex.org/W4315606099","https://openalex.org/W4378375546","https://openalex.org/W4379928223","https://openalex.org/W4382491114","https://openalex.org/W4385481295","https://openalex.org/W4385809408","https://openalex.org/W4386075673","https://openalex.org/W4386076039","https://openalex.org/W4388129777","https://openalex.org/W4388574886","https://openalex.org/W4390872559","https://openalex.org/W4390874575","https://openalex.org/W4391021462","https://openalex.org/W4391109864","https://openalex.org/W4391991763","https://openalex.org/W4392719481","https://openalex.org/W4392824656","https://openalex.org/W4393184662","https://openalex.org/W4393571644","https://openalex.org/W4394597311","https://openalex.org/W4394625830","https://openalex.org/W4394758452","https://openalex.org/W4399409690","https://openalex.org/W4400579361","https://openalex.org/W4402703114","https://openalex.org/W4402754258","https://openalex.org/W4402754280","https://openalex.org/W4402952511","https://openalex.org/W4402979381","https://openalex.org/W4408634392","https://openalex.org/W4413146203"],"related_works":[],"abstract_inverted_index":{"Segment":[0],"Anything":[1],"Model":[2],"(SAM),":[3],"known":[4],"for":[5,153,212],"its":[6,19,81,139,210],"remarkable":[7],"zero-shot":[8,83,207],"segmentation":[9,59,185,197],"capabilities,":[10],"has":[11],"garnered":[12],"significant":[13],"attention":[14],"in":[15,162],"the":[16,40,109,173,183,200],"community.":[17],"Nevertheless,":[18],"performance":[20,186,202],"is":[21,36,169],"challenged":[22],"when":[23],"dealing":[24],"with":[25,119,157],"what":[26],"we":[27,64,147],"refer":[28],"to":[29,56,71,164,171],"as":[30],"visually":[31,76],"non-salient":[32,77,117],"scenarios,":[33,156],"where":[34],"there":[35],"low":[37],"contrast":[38,163],"between":[39],"foreground":[41],"and":[42,54,101,124,141,180,187,217],"background.":[43],"In":[44,61,143],"these":[45],"cases,":[46],"existing":[47],"methods":[48],"often":[49],"cannot":[50],"capture":[51],"accurate":[52],"contours":[53],"fail":[55],"produce":[57],"promising":[58],"results.":[60],"this":[62,87],"paper,":[63],"propose":[65],"Visually":[66],"Non-Salient":[67,102],"SAM":[68,110],"(VNS-SAM),":[69],"aiming":[70],"enhance":[72],"SAM's":[73,91],"perception":[74],"of":[75,116,130,145,203],"scenarios":[78],"while":[79],"preserving":[80],"original":[82],"generalizability.":[84],"We":[85],"achieve":[86],"by":[88],"effectively":[89],"exploiting":[90],"low-level":[92],"features":[93,179],"through":[94],"two":[95],"designs:":[96],"Mask-Edge":[97],"Token":[98],"Interactive":[99],"decoder":[100,111],"Feature":[103],"Mining":[104],"module.":[105],"These":[106],"designs":[107],"help":[108],"gain":[112],"a":[113,150],"deeper":[114],"understanding":[115],"characteristics":[118],"only":[120],"marginal":[121],"parameter":[122],"increments":[123],"computational":[125],"requirements.":[126],"The":[127],"additional":[128],"parameters":[129],"VNS-SAM":[131],"can":[132],"be":[133],"optimized":[134],"within":[135],"4":[136],"hours,":[137],"demonstrating":[138],"feasibility":[140],"practicality.":[142],"terms":[144],"data,":[146],"established":[148],"VNS-SEG,":[149],"unified":[151],"dataset":[152],"various":[154,195],"VNS":[155,178,190,196],"more":[158,176],"than":[159],"35K":[160],"images,":[161],"previous":[165],"single-task":[166],"adaptations.":[167],"It":[168],"designed":[170],"make":[172],"model":[174],"learn":[175],"robust":[177],"comprehensively":[181],"benchmark":[182],"model's":[184],"generalizability":[188],"on":[189],"scenarios.":[191],"Extensive":[192],"experiments":[193],"across":[194],"tasks":[198],"demonstrate":[199],"superior":[201],"VNS-SAM,":[204],"particularly":[205],"under":[206],"settings,":[208],"highlighting":[209],"potential":[211],"broad":[213],"real-world":[214],"applications.":[215],"Codes":[216],"datasets":[218],"are":[219],"publicly":[220],"available":[221],"at":[222],"https://guangqian-guo.github.io/VNS-SAM/.":[223]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-01-17T00:00:00"}
