{"id":"https://openalex.org/W7154300031","doi":"https://doi.org/10.48550/arxiv.2604.10971","title":"MMR-AD: A Large-Scale Multimodal Dataset for Benchmarking General Anomaly Detection with Multimodal Large Language Models","display_name":"MMR-AD: A Large-Scale Multimodal Dataset for Benchmarking General Anomaly Detection with Multimodal Large Language Models","publication_year":2026,"publication_date":"2026-04-13","ids":{"openalex":"https://openalex.org/W7154300031","doi":"https://doi.org/10.48550/arxiv.2604.10971"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.10971","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10971","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.10971","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016491389","display_name":"Xincheng Yao","orcid":"https://orcid.org/0000-0002-0356-3242"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yao, Xincheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038906379","display_name":"Zefeng Qian","orcid":"https://orcid.org/0000-0001-7225-9239"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Zefeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133560473","display_name":"Chao Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Chao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133557597","display_name":"Jiayang Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Jiayang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125630004","display_name":"Chongyang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chongyang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5016491389"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.0024999999441206455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10220","display_name":"Machine Fault Diagnosis Techniques","score":0.002400000113993883,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/anomaly-detection","display_name":"Anomaly detection","score":0.7843999862670898},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.635699987411499},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6101999878883362},{"id":"https://openalex.org/keywords/anomaly","display_name":"Anomaly (physics)","score":0.5924999713897705},{"id":"https://openalex.org/keywords/retraining","display_name":"Retraining","score":0.5738999843597412},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.39879998564720154}],"concepts":[{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.7843999862670898},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7160000205039978},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.635699987411499},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6243000030517578},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6101999878883362},{"id":"https://openalex.org/C12997251","wikidata":"https://www.wikidata.org/wiki/Q567560","display_name":"Anomaly (physics)","level":2,"score":0.5924999713897705},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5802000164985657},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.5738999843597412},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.39879998564720154},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.396699994802475},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.35109999775886536},{"id":"https://openalex.org/C171078966","wikidata":"https://www.wikidata.org/wiki/Q111029","display_name":"Root (linguistics)","level":2,"score":0.3440000116825104},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3100999891757965},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.2718999981880188}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.10971","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10971","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.10971","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10971","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"the":[1,17,21,51,98,107,113,167,179,201],"progress":[2],"of":[3,94,170],"industrial":[4,180],"anomaly":[5,8,67,227],"detection,":[6],"general":[7,27,33,66,81,143],"detection":[9,68,228],"(GAD)":[10],"is":[11,150,193,207],"an":[12],"emerging":[13],"trend":[14],"and":[15,24,75,133,157,206,229],"also":[16,119,186],"ultimate":[18],"goal.":[19],"Unlike":[20],"conventional":[22],"single-":[23],"multi-class":[25],"AD,":[26],"AD":[28,34,82,110,123,129,144,160,168,196],"aims":[29],"to":[30,70],"train":[31],"a":[32,151,188,194],"model":[35,197],"that":[36,166,198,216],"can":[37],"directly":[38],"detect":[39],"anomalies":[40],"in":[41,64,109,204,225],"diverse":[42],"novel":[43],"classes":[44],"without":[45],"any":[46],"retraining":[47],"or":[48],"fine-tuning":[49],"on":[50,92,183],"target":[52],"data.":[53],"Recently,":[54],"Multimodal":[55],"Large":[56],"Language":[57],"Models":[58],"(MLLMs)":[59],"have":[60,103],"shown":[61],"great":[62],"promise":[63],"achieving":[65],"due":[69,86],"their":[71],"revolutionary":[72],"visual":[73],"understanding":[74],"language":[76],"reasoning":[77],"capabilities.":[78],"However,":[79],"MLLM's":[80],"ability":[83],"remains":[84],"underexplored":[85],"to:":[87],"(1)":[88],"MLLMs":[89,174,224],"are":[90,118,131],"pretrained":[91],"amounts":[93],"data":[95,101,108,203],"sourced":[96],"from":[97,200],"Web,":[99],"these":[100],"still":[102,175],"significant":[104],"gaps":[105],"with":[106],"scenarios.":[111],"Moreover,":[112],"image-text":[114],"pairs":[115],"during":[116],"pretraining":[117],"not":[120,134],"specifically":[121],"for":[122,137,154],"tasks.":[124],"(2)":[125],"The":[126],"current":[127,171],"mainstream":[128],"datasets":[130],"image-based":[132],"yet":[135],"suitable":[136],"post-training":[138],"MLLMs.":[139],"To":[140],"facilitate":[141],"MLLM-based":[142,159],"research,":[145],"we":[146,164,185],"present":[147],"MMR-AD,":[148,163,184],"which":[149,192],"comprehensive":[152],"benchmark":[153],"both":[155,226],"training":[156],"evaluating":[158],"models.":[161],"With":[162],"reveal":[165],"performance":[169],"SOTA":[172],"generalist":[173,223],"falls":[176],"far":[177],"behind":[178],"requirements.":[181],"Based":[182],"propose":[187],"baseline":[189],"model,":[190],"Anomaly-R1,":[191],"reasoning-based":[195],"learns":[199],"CoT":[202],"MMR-AD":[205],"further":[208],"enhanced":[209],"by":[210],"reinforcement":[211],"learning.":[212],"Extensive":[213],"experiments":[214],"show":[215],"our":[217],"Anomaly-R1":[218],"achieves":[219],"remarkable":[220],"improvements":[221],"over":[222],"localization.":[230]},"counts_by_year":[],"updated_date":"2026-04-15T06:04:33.058270","created_date":"2026-04-15T00:00:00"}
