{"id":"https://openalex.org/W4404078863","doi":"https://doi.org/10.1109/tcsvt.2024.3491865","title":"Cross-Modal Learning for Anomaly Detection in Complex Industrial Process: Methodology and Benchmark","display_name":"Cross-Modal Learning for Anomaly Detection in Complex Industrial Process: Methodology and Benchmark","publication_year":2024,"publication_date":"2024-11-05","ids":{"openalex":"https://openalex.org/W4404078863","doi":"https://doi.org/10.1109/tcsvt.2024.3491865"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3491865","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3491865","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005210294","display_name":"Gaochang Wu","orcid":"https://orcid.org/0000-0002-5149-2995"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Gaochang Wu","raw_affiliation_strings":["State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]},{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100612457","display_name":"Yapeng Zhang","orcid":"https://orcid.org/0000-0003-0266-0443"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yapeng Zhang","raw_affiliation_strings":["State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]},{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100894390","display_name":"Lan Deng","orcid":"https://orcid.org/0009-0002-4830-9544"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lan Deng","raw_affiliation_strings":["State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]},{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100630363","display_name":"Jingxin Zhang","orcid":"https://orcid.org/0000-0002-9450-188X"},"institutions":[{"id":"https://openalex.org/I57093077","display_name":"Swinburne University of Technology","ror":"https://ror.org/031rekg67","country_code":"AU","type":"education","lineage":["https://openalex.org/I57093077"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Jingxin Zhang","raw_affiliation_strings":["School of Software and Electrical Engineering, Swinburne University of Technology, Melbourne, VIC, Australia"],"affiliations":[{"raw_affiliation_string":"School of Software and Electrical Engineering, Swinburne University of Technology, Melbourne, VIC, Australia","institution_ids":["https://openalex.org/I57093077"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042520521","display_name":"Tianyou Chai","orcid":"https://orcid.org/0000-0002-4623-1483"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianyou Chai","raw_affiliation_strings":["State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]},{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries, Northeastern University, Shenyang, P. R. China","institution_ids":["https://openalex.org/I9224756"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5005210294"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":null,"apc_paid":null,"fwci":7.425,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.97858442,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"35","issue":"3","first_page":"2632","last_page":"2645"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9765999913215637,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9765999913215637,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9333999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.6590109467506409},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6477551460266113},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6022562384605408},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5699482560157776},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5188832879066467},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4991111755371094},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3410302400588989},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32137805223464966},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.08782094717025757}],"concepts":[{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.6590109467506409},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6477551460266113},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6022562384605408},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5699482560157776},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5188832879066467},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4991111755371094},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3410302400588989},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32137805223464966},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.08782094717025757},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3491865","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3491865","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.46000000834465027}],"awards":[{"id":"https://openalex.org/G2407125372","display_name":null,"funder_award_id":"U20A20189","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3613092334","display_name":null,"funder_award_id":"N2424004","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G5898287775","display_name":null,"funder_award_id":"61991404","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6449511876","display_name":null,"funder_award_id":"62103092","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7967096143","display_name":null,"funder_award_id":"62173120","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8012131583","display_name":null,"funder_award_id":"61991401","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1965628919","https://openalex.org/W1983044509","https://openalex.org/W2009700261","https://openalex.org/W2031489346","https://openalex.org/W2064675550","https://openalex.org/W2122646361","https://openalex.org/W2170505850","https://openalex.org/W2766123902","https://openalex.org/W2766252842","https://openalex.org/W2766447205","https://openalex.org/W2797697401","https://openalex.org/W2803603634","https://openalex.org/W2919115771","https://openalex.org/W2963717374","https://openalex.org/W2998356391","https://openalex.org/W3004999940","https://openalex.org/W3046194589","https://openalex.org/W3156117144","https://openalex.org/W3168216528","https://openalex.org/W3168640669","https://openalex.org/W3177318507","https://openalex.org/W3180570338","https://openalex.org/W3202384916","https://openalex.org/W3210279979","https://openalex.org/W3214102707","https://openalex.org/W4205222700","https://openalex.org/W4214520160","https://openalex.org/W4214612132","https://openalex.org/W4226169791","https://openalex.org/W4283739673","https://openalex.org/W4283811196","https://openalex.org/W4312480274","https://openalex.org/W4312554543","https://openalex.org/W4312614039","https://openalex.org/W4312956471","https://openalex.org/W4313427304","https://openalex.org/W4318586084","https://openalex.org/W4323022360","https://openalex.org/W4376226279","https://openalex.org/W4382119107","https://openalex.org/W4382467086","https://openalex.org/W4385245566","https://openalex.org/W4386065852","https://openalex.org/W4386076398","https://openalex.org/W4386526950","https://openalex.org/W4388854793","https://openalex.org/W4389331911","https://openalex.org/W4392172944","https://openalex.org/W4400409509","https://openalex.org/W6696085341","https://openalex.org/W6757817989","https://openalex.org/W6766978945","https://openalex.org/W6778883912","https://openalex.org/W6791353385","https://openalex.org/W6798487212","https://openalex.org/W6802061597","https://openalex.org/W6809860847","https://openalex.org/W6838322825","https://openalex.org/W6838434436","https://openalex.org/W6850503672","https://openalex.org/W6857279128"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W4321353415","https://openalex.org/W2745001401","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W4246352526","https://openalex.org/W2121910908","https://openalex.org/W915438175","https://openalex.org/W4230315250"],"abstract_inverted_index":{"Anomaly":[0],"detection":[1,19,64,152],"in":[2,10,77,110,203],"complex":[3],"industrial":[4,232],"processes":[5],"plays":[6],"a":[7,55,89,111,115,172],"pivotal":[8],"role":[9],"ensuring":[11],"efficient,":[12],"stable,":[13],"and":[14,73,105,134,154,186,214,225],"secure":[15],"operation.":[16],"Existing":[17],"anomaly":[18,63,120,159],"methods":[20],"primarily":[21],"focus":[22],"on":[23,40],"analyzing":[24],"dominant":[25],"anomalies":[26],"using":[27],"the":[28,46,67,78,81,96,101,106,123,144,150,157,163,166,177,197],"process":[29,74],"variables":[30,75],"(such":[31],"as":[32,211],"arc":[33],"current)":[34],"or":[35],"constructing":[36],"neural":[37],"networks":[38],"based":[39],"abnormal":[41],"visual":[42,70,215],"features,":[43,147],"while":[44],"overlooking":[45],"intrinsic":[47],"correlation":[48,68,146],"of":[49,80,118,165,176],"cross-modal":[50,56,174,195],"information.":[51],"This":[52],"paper":[53],"proposes":[54],"Transformer":[57],"(dubbed":[58],"FmFormer),":[59],"designed":[60],"to":[61,93,127,137,230],"facilitate":[62],"by":[65,218],"exploring":[66],"between":[69,100],"features":[71,130],"(video)":[72],"(current)":[76],"context":[79],"fused":[82,178],"magnesium":[83,179],"smelting":[84,180],"process.":[85],"Our":[86],"approach":[87],"introduces":[88],"novel":[90],"tokenization":[91],"paradigm":[92],"effectively":[94],"bridge":[95],"substantial":[97],"dimensionality":[98],"gap":[99],"3D":[102],"video":[103,185],"modality":[104,109,133],"1D":[107],"current":[108,187,212],"multiscale":[112],"manner,":[113],"enabling":[114],"hierarchical":[116],"reconstruction":[117],"pixel-level":[119],"detection.":[121],"Subsequently,":[122],"FmFormer":[124,199],"leverages":[125],"self-attention":[126],"learn":[128],"internal":[129],"within":[131],"each":[132],"bidirectional":[135,145],"cross-attention":[136],"capture":[138],"correlations":[139],"across":[140],"modalities.":[141],"By":[142],"decoding":[143],"we":[148,169],"obtain":[149],"final":[151],"result":[153],"even":[155],"locate":[156],"specific":[158],"region.":[160],"To":[161],"validate":[162],"effectiveness":[164],"proposed":[167,198],"method,":[168],"also":[170],"present":[171],"pioneering":[173],"benchmark":[175,226,238],"process,":[181],"featuring":[182],"synchronously":[183],"acquired":[184],"data":[188],"for":[189],"over":[190],"2.2":[191],"million":[192],"samples.":[193],"Leveraging":[194],"learning,":[196],"achieves":[200],"state-of-the-art":[201],"performance":[202],"detecting":[204],"anomalies,":[205],"particularly":[206],"under":[207],"extreme":[208],"interferences":[209],"such":[210],"fluctuations":[213],"occlusion":[216],"caused":[217],"heavy":[219],"water":[220],"mist.":[221],"The":[222,237],"presented":[223],"methodology":[224],"may":[227],"be":[228,240],"applicable":[229],"other":[231],"applications":[233],"with":[234],"some":[235],"amendments.":[236],"will":[239],"released":[241],"at":[242],"<uri":[243],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[244],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/GaochangWu/FMF-Benchmark</uri>.":[245]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":19}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
