{"id":"https://openalex.org/W4412353449","doi":"https://doi.org/10.1109/tnnls.2025.3585887","title":"DefectSAM: Hierarchically Adapting SAM for Pixel-Wise Surface Defect Detection","display_name":"DefectSAM: Hierarchically Adapting SAM for Pixel-Wise Surface Defect Detection","publication_year":2025,"publication_date":"2025-07-11","ids":{"openalex":"https://openalex.org/W4412353449","doi":"https://doi.org/10.1109/tnnls.2025.3585887","pmid":"https://pubmed.ncbi.nlm.nih.gov/40644089"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2025.3585887","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2025.3585887","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101527301","display_name":"Feng Yan","orcid":"https://orcid.org/0000-0002-2683-8878"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Feng Yan","raw_affiliation_strings":["School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060665015","display_name":"Xiaoheng Jiang","orcid":"https://orcid.org/0000-0002-5770-0417"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoheng Jiang","raw_affiliation_strings":["School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015452096","display_name":"Yang Lu","orcid":"https://orcid.org/0000-0002-2564-1993"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Lu","raw_affiliation_strings":["School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China","institution_ids":["https://openalex.org/I38877650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037129512","display_name":"Jiale Cao","orcid":"https://orcid.org/0000-0002-5160-6841"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiale Cao","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081346568","display_name":"Mingliang Xu","orcid":"https://orcid.org/0000-0002-6885-3451"},"institutions":[{"id":"https://openalex.org/I38877650","display_name":"Zhengzhou University","ror":"https://ror.org/04ypx8c21","country_code":"CN","type":"education","lineage":["https://openalex.org/I38877650"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingliang Xu","raw_affiliation_strings":["School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Zhengzhou University, Zhengzhou, China","institution_ids":["https://openalex.org/I38877650"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101527301"],"corresponding_institution_ids":["https://openalex.org/I38877650"],"apc_list":null,"apc_paid":null,"fwci":1.3271,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.83836953,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"36","issue":"10","first_page":"18830","last_page":"18843"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11606","display_name":"Infrastructure Maintenance and Monitoring","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7402313947677612},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7120245695114136},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6812170743942261},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6118010878562927},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6104591488838196},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.5065451860427856},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4831832945346832},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.4738227128982544},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4690970182418823},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.45735234022140503},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10876187682151794}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7402313947677612},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7120245695114136},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6812170743942261},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6118010878562927},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6104591488838196},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5065451860427856},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4831832945346832},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.4738227128982544},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4690970182418823},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.45735234022140503},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10876187682151794},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2025.3585887","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2025.3585887","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:40644089","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40644089","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5202935399","display_name":null,"funder_award_id":"ZDBJ202534","funder_id":"https://openalex.org/F4320321760","funder_display_name":"Henan University of Science and Technology"},{"id":"https://openalex.org/G5570243985","display_name":null,"funder_award_id":"232300421093","funder_id":"https://openalex.org/F4320323845","funder_display_name":"Natural Science Foundation of Henan Province"},{"id":"https://openalex.org/G7272499820","display_name":null,"funder_award_id":"U21B2037","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8306412014","display_name":null,"funder_award_id":"62172371","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321760","display_name":"Henan University of Science and Technology","ror":"https://ror.org/05d80kz58"},{"id":"https://openalex.org/F4320323845","display_name":"Natural Science Foundation of Henan Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W1982075130","https://openalex.org/W1994922096","https://openalex.org/W2012496675","https://openalex.org/W2100470808","https://openalex.org/W2132083787","https://openalex.org/W2194775991","https://openalex.org/W2560023338","https://openalex.org/W2565639579","https://openalex.org/W2780861787","https://openalex.org/W2884563051","https://openalex.org/W2888407265","https://openalex.org/W2963529609","https://openalex.org/W2963868681","https://openalex.org/W3034314048","https://openalex.org/W3035487542","https://openalex.org/W3122006940","https://openalex.org/W3135064036","https://openalex.org/W3164098653","https://openalex.org/W3191879248","https://openalex.org/W4214561053","https://openalex.org/W4226512186","https://openalex.org/W4283813802","https://openalex.org/W4285279978","https://openalex.org/W4292347849","https://openalex.org/W4304084053","https://openalex.org/W4312710812","https://openalex.org/W4312746376","https://openalex.org/W4313270795","https://openalex.org/W4313546627","https://openalex.org/W4320009770","https://openalex.org/W4320036807","https://openalex.org/W4322707121","https://openalex.org/W4381716707","https://openalex.org/W4384080166","https://openalex.org/W4385236855","https://openalex.org/W4385245566","https://openalex.org/W4386072314","https://openalex.org/W4386076039","https://openalex.org/W4387917853","https://openalex.org/W4389252811","https://openalex.org/W4390190100","https://openalex.org/W4390874575","https://openalex.org/W4391021462","https://openalex.org/W4392309443","https://openalex.org/W4393160910","https://openalex.org/W4400721967","https://openalex.org/W4402660119","https://openalex.org/W4402716453","https://openalex.org/W4402727285","https://openalex.org/W4403446611","https://openalex.org/W4403594096","https://openalex.org/W4403791281","https://openalex.org/W4404177154","https://openalex.org/W4406520988"],"related_works":["https://openalex.org/W3135697610","https://openalex.org/W4390516098","https://openalex.org/W2085033728","https://openalex.org/W4285411112","https://openalex.org/W2997567050","https://openalex.org/W2171299904","https://openalex.org/W4249847449","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W1647606319"],"abstract_inverted_index":{"Segment":[0],"anything":[1],"model":[2],"(SAM)":[3],"has":[4],"recently":[5],"demonstrated":[6],"powerful":[7],"segmentation":[8],"ability":[9],"for":[10,46,136,160],"natural":[11],"scene":[12],"images":[13],"(NSIs).":[14],"However,":[15],"the":[16,26,61,76,80,89,99,106,141,144,189,202],"SAM":[17,45,205],"exhibits":[18],"limited":[19],"performance":[20,194],"in":[21,34,206],"defect":[22,49,65,138,166,176,207],"detection":[23,177],"owing":[24],"to":[25,63,82,120,153],"weak":[27],"appearance":[28],"of":[29,60,86,147,204],"defects":[30],"and":[31,56,79,105,127,157,168,184],"cluttered":[32],"backgrounds":[33],"industrial":[35],"images.":[36],"In":[37],"this":[38],"article,":[39],"we":[40,68],"propose":[41],"a":[42,70,123],"hierarchically":[43],"adapting":[44],"pixel-wise":[47],"surface":[48],"detection,":[50],"named":[51],"DefectSAM,":[52],"which":[53,133,199],"effectively":[54],"modulates":[55],"decodes":[57],"multilevel":[58],"features":[59,87,129,149],"encoder":[62,78],"capture":[64],"information.":[66],"Specifically,":[67],"introduce":[69],"learnable":[71,197],"feature":[72,101,108,125,131,161],"adaptation":[73,91,95,102,109],"component":[74],"between":[75],"image":[77],"decoder":[81],"modulate":[83],"each":[84],"level":[85],"via":[88],"dual-feature":[90,94],"unit.":[92],"The":[93,112],"unit":[96],"mainly":[97],"includes":[98],"correlation-gated":[100],"(CGFA)":[103],"module":[104],"mask-guided":[107],"(MGFA)":[110],"module.":[111],"CGFA":[113],"exploits":[114],"cross":[115],"correlation":[116],"spatial":[117],"gating":[118],"maps":[119],"adaptively":[121],"incorporate":[122],"convolutional":[124],"pyramid":[126],"Transformer":[128],"during":[130],"adaptation,":[132,162],"is":[134],"beneficial":[135],"capturing":[137],"details.":[139],"Moreover,":[140],"MGFA":[142],"utilizes":[143],"mask":[145],"prediction":[146],"high-level":[148],"as":[150],"semantic":[151],"guidance":[152],"select":[154],"top-confidence":[155],"foreground":[156],"background":[158,170],"tokens":[159],"focusing":[163],"more":[164],"on":[165,174],"details":[167],"suppressing":[169],"noise.":[171],"Extensive":[172],"experiments":[173],"three":[175],"datasets":[178],"(i.e.,":[179],"MVTec":[180],"AD,":[181],"CrackSeg9k,":[182],"ZJU-Leaper,":[183],"Magnetic":[185],"tile)":[186],"demonstrate":[187],"that":[188],"proposed":[190],"method":[191],"achieves":[192],"state-of-the-art":[193],"with":[195],"few":[196],"parameters,":[198],"greatly":[200],"improves":[201],"generalization":[203],"detection.":[208]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-11T23:09:37.256380","created_date":"2025-10-10T00:00:00"}
