{"id":"https://openalex.org/W4415538298","doi":"https://doi.org/10.1145/3746027.3754891","title":"HGCF: Hierarchical Geometry-Color Fusion for Multimodal Industrial Anomaly Detection","display_name":"HGCF: Hierarchical Geometry-Color Fusion for Multimodal Industrial Anomaly Detection","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415538298","doi":"https://doi.org/10.1145/3746027.3754891"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3754891","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3754891","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076998721","display_name":"Min Li","orcid":"https://orcid.org/0000-0002-0507-5576"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Min Li","raw_affiliation_strings":["Faculty of Data Science, City University of Macau, Macau, China and Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China"],"raw_orcid":"https://orcid.org/0000-0002-0507-5576","affiliations":[{"raw_affiliation_string":"Faculty of Data Science, City University of Macau, Macau, China and Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China","institution_ids":["https://openalex.org/I152269853"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jinghui He","orcid":"https://orcid.org/0009-0003-2249-1250"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinghui He","raw_affiliation_strings":["Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China"],"raw_orcid":"https://orcid.org/0009-0003-2249-1250","affiliations":[{"raw_affiliation_string":"Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China","institution_ids":["https://openalex.org/I152269853"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024716590","display_name":"Jiachen Li","orcid":"https://orcid.org/0000-0002-3543-6088"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiachen Li","raw_affiliation_strings":["Shandong Provincial Key Laboratory of Computing Power Internet and Service Computing, Shandong Fundamental Research Center for Computer Science, Jinan, Shandong Province, China"],"raw_orcid":"https://orcid.org/0000-0002-3543-6088","affiliations":[{"raw_affiliation_string":"Shandong Provincial Key Laboratory of Computing Power Internet and Service Computing, Shandong Fundamental Research Center for Computer Science, Jinan, Shandong Province, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024839815","display_name":"Delong Han","orcid":"https://orcid.org/0000-0001-7195-3413"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Delong Han","raw_affiliation_strings":["Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China"],"raw_orcid":"https://orcid.org/0000-0001-7195-3413","affiliations":[{"raw_affiliation_string":"Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China","institution_ids":["https://openalex.org/I152269853"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049355981","display_name":"Jin Wan","orcid":"https://orcid.org/0000-0001-9245-0110"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Wan","raw_affiliation_strings":["Shandong Provincial Key Laboratory of Computing Power Internet and Service Computing, Shandong Fundamental Research Center for Computer Science, Jinan, Shandong Province, China"],"raw_orcid":"https://orcid.org/0000-0001-9245-0110","affiliations":[{"raw_affiliation_string":"Shandong Provincial Key Laboratory of Computing Power Internet and Service Computing, Shandong Fundamental Research Center for Computer Science, Jinan, Shandong Province, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056862464","display_name":"Gang Li","orcid":"https://orcid.org/0000-0002-7896-4833"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Li","raw_affiliation_strings":["Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China and Faculty of Data Science, City University of Macau, Macau, China"],"raw_orcid":"https://orcid.org/0000-0002-7896-4833","affiliations":[{"raw_affiliation_string":"Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center (National Supercomputer Center in Jinan), Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong Province, China and Faculty of Data Science, City University of Macau, Macau, China","institution_ids":["https://openalex.org/I152269853"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5076998721"],"corresponding_institution_ids":["https://openalex.org/I152269853"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.15600304,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1023","last_page":"1031"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9811000227928162,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9340999722480774,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.6396999955177307},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.6074000000953674},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5210000276565552},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5160999894142151},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5012000203132629},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.49619999527931213},{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.49160000681877136},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4025999903678894},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.39419999718666077}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7204999923706055},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7145000100135803},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.6396999955177307},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.6074000000953674},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5210000276565552},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5160999894142151},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5012000203132629},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.49619999527931213},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.49160000681877136},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.45910000801086426},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4025999903678894},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.39419999718666077},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.3808000087738037},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3345000147819519},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.33309999108314514},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C12997251","wikidata":"https://www.wikidata.org/wiki/Q567560","display_name":"Anomaly (physics)","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.28519999980926514},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.26899999380111694},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.26080000400543213},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.2526000142097473},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.250900000333786},{"id":"https://openalex.org/C63099799","wikidata":"https://www.wikidata.org/wiki/Q17147001","display_name":"Image texture","level":4,"score":0.25}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3754891","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3754891","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2741108683","display_name":null,"funder_award_id":"2023CXGC010112, NO.tsqnz20240834","funder_id":"https://openalex.org/F4320313895","funder_display_name":"Department of Science and Technology of Shandong Province"},{"id":"https://openalex.org/G575999342","display_name":null,"funder_award_id":"62401305, 62202425","funder_id":"https://openalex.org/F4320321540","funder_display_name":"Ministry of Science and Technology of the People's Republic of China"}],"funders":[{"id":"https://openalex.org/F4320313895","display_name":"Department of Science and Technology of Shandong Province","ror":"https://ror.org/01b9fvd84"},{"id":"https://openalex.org/F4320321540","display_name":"Ministry of Science and Technology of the People's Republic of China","ror":"https://ror.org/027s68j25"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W4385805005","https://openalex.org/W4386065775","https://openalex.org/W4386065890","https://openalex.org/W4390875033","https://openalex.org/W4391669018","https://openalex.org/W4391962677","https://openalex.org/W4393147759","https://openalex.org/W4393148014","https://openalex.org/W4393237822","https://openalex.org/W4394597849","https://openalex.org/W4394625793","https://openalex.org/W4400411624","https://openalex.org/W4402753796"],"related_works":[],"abstract_inverted_index":{"While":[0],"current":[1],"multimodal":[2],"anomaly":[3],"detection":[4,124],"methods":[5],"predominantly":[6],"employ":[7],"intermediate":[8],"fusion":[9,60],"strategies,":[10],"they":[11],"often":[12],"suffer":[13],"from":[14],"inadequate":[15],"cross-modal":[16,58],"interaction":[17],"and":[18,48,70,113,139],"irreversible":[19],"information":[20,65],"loss":[21],"during":[22],"feature":[23,89,93],"alignment":[24],"processes.":[25],"To":[26],"overcome":[27],"these":[28],"limitations,":[29],"we":[30,54,78,101],"propose":[31,55,102],"Hierarchical":[32],"Geometry-Color":[33],"Fusion":[34],"(HGCF),":[35],"a":[36,56,80,103],"novel":[37],"framework":[38],"that":[39,62],"establishes":[40],"deep":[41],"synergistic":[42],"relationships":[43],"between":[44,67],"RGB":[45,71],"texture":[46],"features":[47,120],"point":[49,68],"cloud":[50,69],"geometric":[51,83],"representations.":[52],"Firstly,":[53],"bidirectional":[57],"early":[59],"mechanism":[61],"enables":[63],"complementary":[64],"exchange":[66],"modalities":[72],"at":[73],"the":[74,123],"input":[75],"level.":[76],"Secondly,":[77],"introduce":[79],"local":[81,104,118],"self-supervised":[82],"color":[84],"reconstruction":[85,98],"network":[86],"with":[87],"group-wise":[88],"alignment,":[90],"enhancing":[91],"fine-grained":[92],"extraction":[94],"through":[95],"joint":[96],"color-geometry":[97],"tasks.":[99],"Finally,":[100],"window":[105],"spatial-consistent":[106],"attention":[107],"fusion,":[108],"which":[109],"achieves":[110,133],"semantic":[111],"consistency":[112,115],"spatial":[114],"by":[116],"emphasizing":[117],"mutation":[119],"to":[121],"improve":[122],"of":[125],"subtle":[126],"anomalies.":[127],"Extensive":[128],"experiments":[129],"show":[130],"our":[131],"model":[132],"99.1%":[134],"I-AUROC":[135],"on":[136,141],"MVTec":[137],"3D-AD":[138],"91.7%":[140],"Eyecandies,":[142],"both":[143],"surpassing":[144],"state-of-the-art":[145],"methods.":[146]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-25T00:00:00"}
