{"id":"https://openalex.org/W4415709246","doi":"https://doi.org/10.1109/icme59968.2025.11209158","title":"EIAD: Explainable Industrial Anomaly Detection Via Multi-Modal Large Language Models","display_name":"EIAD: Explainable Industrial Anomaly Detection Via Multi-Modal Large Language Models","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4415709246","doi":"https://doi.org/10.1109/icme59968.2025.11209158"},"language":null,"primary_location":{"id":"doi:10.1109/icme59968.2025.11209158","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209158","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018742547","display_name":"Zongyun Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zongyun Zhang","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020776216","display_name":"Jiacheng Ruan","orcid":"https://orcid.org/0009-0002-1590-1955"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiacheng Ruan","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003889945","display_name":"Xian Gao","orcid":"https://orcid.org/0000-0002-5301-0515"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xian Gao","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100418165","display_name":"Ting Liu","orcid":"https://orcid.org/0000-0003-3489-4578"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ting Liu","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101704886","display_name":"Yuzhuo Fu","orcid":"https://orcid.org/0000-0001-5516-3016"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuzhuo Fu","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5018742547"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":6.1709,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.96366013,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.29120001196861267,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.29120001196861267,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0885000005364418,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.04479999840259552,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.7333999872207642},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.625},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.4341000020503998},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4205000102519989},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.38909998536109924},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.38580000400543213},{"id":"https://openalex.org/keywords/fault-detection-and-isolation","display_name":"Fault detection and isolation","score":0.33399999141693115}],"concepts":[{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.7333999872207642},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6861000061035156},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.625},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5546000003814697},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4408000111579895},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.4341000020503998},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4205000102519989},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.38909998536109924},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.38580000400543213},{"id":"https://openalex.org/C152745839","wikidata":"https://www.wikidata.org/wiki/Q5438153","display_name":"Fault detection and isolation","level":3,"score":0.33399999141693115},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31690001487731934},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.3012999892234802},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3010999858379364},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.28360000252723694},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2736000120639801},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2556000053882599}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme59968.2025.11209158","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209158","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2948982773","https://openalex.org/W3034314048","https://openalex.org/W3159648608","https://openalex.org/W4212919149","https://openalex.org/W4312605624","https://openalex.org/W4323647550","https://openalex.org/W4386065385","https://openalex.org/W4390874575","https://openalex.org/W4393158476","https://openalex.org/W4402702916","https://openalex.org/W4402727018","https://openalex.org/W4402754134","https://openalex.org/W4403940533"],"related_works":[],"abstract_inverted_index":{"Industrial":[0,159],"Anomaly":[1,160],"Detection":[2,116,161],"(IAD)":[3],"is":[4,92],"critical":[5],"to":[6,57,80,105],"ensure":[7],"product":[8],"quality":[9],"during":[10,59],"manufacturing.":[11],"Although":[12],"existing":[13],"zero-shot":[14],"defect":[15,77,125,168],"segmentation":[16],"and":[17,51,98,127,141,143,170],"detection":[18,111,169],"methods":[19],"have":[20],"shown":[21],"effectiveness,":[22],"they":[23],"cannot":[24],"provide":[25],"detailed":[26],"descriptions":[27],"of":[28,34,124,188],"the":[29,32,60,82,86,106,186],"defects.":[30],"Furthermore,":[31],"application":[33],"large":[35],"multi-modal":[36,76,108],"models":[37],"in":[38,41,46,167,193],"IAD":[39],"remains":[40],"its":[42],"infancy,":[43],"facing":[44],"challenges":[45],"balancing":[47],"question-answering":[48],"(QA)":[49],"performance":[50,166],"mask-based":[52],"grounding":[53],"capabilities,":[54],"often":[55],"owing":[56],"overfitting":[58],"fine-tuning":[61],"process.":[62],"To":[63],"address":[64],"these":[65],"challenges,":[66],"we":[67,103],"propose":[68],"a":[69,74,121,145],"novel":[70],"approach":[71],"that":[72,133,154],"introduces":[73],"dedicated":[75],"localization":[78,171],"module":[79],"decouple":[81],"dialog":[83],"functionality":[84],"from":[85],"core":[87],"feature":[88],"extraction.":[89],"This":[90],"decoupling":[91],"achieved":[93],"through":[94],"independent":[95],"optimization":[96],"objectives":[97],"tailored":[99],"learning":[100],"strategies.":[101],"Additionally,":[102],"contribute":[104],"first":[107],"industrial":[109,128,194],"anomaly":[110],"training":[112],"dataset,":[113],"named":[114],"Defect":[115],"Question":[117],"Answering":[118],"(DDQA),":[119],"encompassing":[120],"wide":[122],"range":[123],"types":[126],"scenarios.":[129],"Unlike":[130],"conventional":[131],"datasets":[132],"rely":[134],"on":[135],"GPT-generated":[136],"data,":[137],"DDQA":[138],"ensures":[139],"authenticity":[140],"reliability":[142],"offers":[144],"robust":[146],"foundation":[147],"for":[148,190],"model":[149],"training.":[150],"Experimental":[151],"results":[152],"demonstrate":[153],"our":[155],"proposed":[156],"method,":[157],"Explainable":[158],"Assistant":[162],"(EIAD),":[163],"achieves":[164],"outstanding":[165],"tasks.":[172],"It":[173],"not":[174],"only":[175],"significantly":[176],"enhances":[177],"accuracy":[178],"but":[179],"also":[180],"improves":[181],"interpretability.":[182],"These":[183],"advancements":[184],"highlight":[185],"potential":[187],"EIAD":[189],"practical":[191],"applications":[192],"settings.":[195]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-30T00:00:00"}
