{"id":"https://openalex.org/W4415020787","doi":"https://doi.org/10.48550/arxiv.2505.13941","title":"MLZero: A Multi-Agent System for End-to-end Machine Learning Automation","display_name":"MLZero: A Multi-Agent System for End-to-end Machine Learning Automation","publication_year":2025,"publication_date":"2025-05-20","ids":{"openalex":"https://openalex.org/W4415020787","doi":"https://doi.org/10.48550/arxiv.2505.13941"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2505.13941","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.13941","pdf_url":"https://arxiv.org/pdf/2505.13941","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2505.13941","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113190707","display_name":"Haoyang Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Fang, Haoyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100781695","display_name":"Boran Han","orcid":"https://orcid.org/0000-0002-3621-3134"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Boran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011601027","display_name":"Nick Erickson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Erickson, Nick","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073395495","display_name":"X. Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060861535","display_name":"S. Zhou","orcid":"https://orcid.org/0000-0002-7517-9653"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Su","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111058345","display_name":"Anirudh Dagar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dagar, Anirudh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040806743","display_name":"Jiani Zhang","orcid":"https://orcid.org/0000-0003-0074-6761"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiani","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020675074","display_name":"Ali Caner T\u00fcrkmen","orcid":"https://orcid.org/0000-0003-2593-1824"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Turkmen, Ali Caner","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100731479","display_name":"Cong Hu","orcid":"https://orcid.org/0000-0002-5309-5985"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Cuixiong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006581225","display_name":"Huzefa Rangwala","orcid":"https://orcid.org/0000-0003-0435-0035"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rangwala, Huzefa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055935194","display_name":"Ying Wu","orcid":"https://orcid.org/0000-0002-5635-8090"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Ying Nian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055825320","display_name":"Bernie Wang","orcid":"https://orcid.org/0000-0002-0291-7184"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Bernie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5082384108","display_name":"George Karypis","orcid":"https://orcid.org/0000-0003-2753-1437"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karypis, George","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5113190707"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9099000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9099000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.6802999973297119},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.49470001459121704},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4609000086784363},{"id":"https://openalex.org/keywords/hallucinating","display_name":"Hallucinating","score":0.4462999999523163},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4345000088214874},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.400299996137619},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.37630000710487366},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.33889999985694885}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7203999757766724},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.6802999973297119},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6503999829292297},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6340000033378601},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.49470001459121704},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4609000086784363},{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.4462999999523163},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4345000088214874},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.400299996137619},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.37630000710487366},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.33889999985694885},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.3163999915122986},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.3154999911785126},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.31200000643730164},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.311599999666214},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3009999990463257},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.2874999940395355},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.2849999964237213},{"id":"https://openalex.org/C2776010242","wikidata":"https://www.wikidata.org/wiki/Q4677575","display_name":"Active perception","level":3,"score":0.2802000045776367},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.2784000039100647}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2505.13941","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.13941","pdf_url":"https://arxiv.org/pdf/2505.13941","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2505.13941","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2505.13941","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2505.13941","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.13941","pdf_url":"https://arxiv.org/pdf/2505.13941","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4415020787.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Existing":[0],"AutoML":[1,126],"systems":[2,175],"have":[3],"advanced":[4],"the":[5,69,89,141],"automation":[6,43],"of":[7,76,152,159],"machine":[8],"learning":[9],"(ML);":[10],"however,":[11],"they":[12],"still":[13],"require":[14],"substantial":[15],"manual":[16],"configuration":[17],"and":[18,83,96,113,155],"expert":[19],"input,":[20],"particularly":[21],"when":[22,121],"handling":[23],"multimodal":[24,61],"data.":[25],"We":[26],"introduce":[27],"MLZero,":[28],"a":[29,145,149,169],"novel":[30],"multi-agent":[31],"framework":[32],"powered":[33],"by":[34,144],"Large":[35],"Language":[36],"Models":[37],"(LLMs)":[38],"that":[39,66],"enables":[40],"end-to-end":[41],"ML":[42],"across":[44],"diverse":[45,136],"data":[46,137],"modalities":[47],"with":[48,94,148,168],"minimal":[49],"human":[50],"intervention.":[51],"A":[52],"cognitive":[53],"perception":[54],"module":[55],"is":[56],"first":[57],"employed,":[58],"transforming":[59],"raw":[60],"inputs":[62],"into":[63],"perceptual":[64],"context":[65],"effectively":[67],"guides":[68],"subsequent":[70],"workflow.":[71],"To":[72],"address":[73],"key":[74],"limitations":[75],"LLMs,":[77],"such":[78],"as":[79],"hallucinated":[80],"code":[81,91],"generation":[82,92],"outdated":[84],"API":[85],"knowledge,":[86],"we":[87],"enhance":[88],"iterative":[90],"process":[93],"semantic":[95],"episodic":[97],"memory.":[98],"MLZero":[99,139],"demonstrates":[100],"superior":[101],"performance":[102],"on":[103,123],"MLE-Bench":[104],"Lite,":[105],"outperforming":[106,173],"all":[107],"competitors":[108],"in":[109],"both":[110],"success":[111,150],"rate":[112,151],"solution":[114],"quality,":[115],"securing":[116],"six":[117],"gold":[118],"medals.":[119],"Additionally,":[120],"evaluated":[122],"our":[124],"Multimodal":[125],"Agent":[127],"Benchmark,":[128],"which":[129],"includes":[130],"25":[131],"more":[132],"challenging":[133],"tasks":[134],"spanning":[135],"modalities,":[138],"outperforms":[140],"competing":[142],"methods":[143],"large":[146],"margin":[147],"0.92":[153],"(+263.6\\%)":[154],"an":[156],"average":[157],"rank":[158],"2.28.":[160],"Our":[161],"approach":[162],"maintains":[163],"its":[164],"robust":[165],"effectiveness":[166],"even":[167],"compact":[170],"8B":[171],"LLM,":[172],"full-size":[174],"from":[176],"existing":[177],"solutions.":[178]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
