{"id":"https://openalex.org/W4396849416","doi":"https://doi.org/10.1088/2632-2153/ad4ae5","title":"Reducing training data needs with minimal multilevel machine learning (M3L)","display_name":"Reducing training data needs with minimal multilevel machine learning (M3L)","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4396849416","doi":"https://doi.org/10.1088/2632-2153/ad4ae5"},"language":"en","primary_location":{"id":"doi:10.1088/2632-2153/ad4ae5","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ad4ae5","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1088/2632-2153/ad4ae5","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024088138","display_name":"Stefan Heinen","orcid":"https://orcid.org/0000-0001-9382-2342"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stefan Heinen","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0001-9382-2342","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074882900","display_name":"Danish Khan","orcid":"https://orcid.org/0000-0001-7529-2202"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Danish Khan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065581694","display_name":"Guido Falk von Rudorff","orcid":"https://orcid.org/0000-0001-7987-4330"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guido Falk von Rudorff","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041329613","display_name":"Konstantin Karandashev","orcid":"https://orcid.org/0000-0002-0943-3051"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Konstantin Karandashev","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079763259","display_name":"Daniel Jose Arismendi Arrieta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Daniel Jose Arismendi Arrieta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001121489","display_name":"Alastair J. A. Price","orcid":"https://orcid.org/0000-0003-3239-8319"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alastair J A Price","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087225504","display_name":"Surajit Nandi","orcid":"https://orcid.org/0000-0002-7105-2209"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Surajit Nandi","raw_affiliation_strings":["Technical University of Denmark, Department of Energy Conversion and Storage, DK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technical University of Denmark, Department of Energy Conversion and Storage, DK","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023121476","display_name":"Arghya Bhowmik","orcid":"https://orcid.org/0000-0003-3198-5116"},"institutions":[{"id":"https://openalex.org/I96673099","display_name":"Technical University of Denmark","ror":"https://ror.org/04qtj9h94","country_code":"DK","type":"education","lineage":["https://openalex.org/I96673099"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Arghya Bhowmik","raw_affiliation_strings":["Technical University of Denmark, Department of Energy Conversion and Storage, DK"],"raw_orcid":"https://orcid.org/0000-0003-3198-5116","affiliations":[{"raw_affiliation_string":"Technical University of Denmark, Department of Energy Conversion and Storage, DK","institution_ids":["https://openalex.org/I96673099"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035932611","display_name":"Kersti Hermansson","orcid":"https://orcid.org/0000-0003-2352-0458"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kersti Hermansson","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0003-2352-0458","affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5088793872","display_name":"O. Anatole von Lilienfeld","orcid":"https://orcid.org/0000-0001-7419-0466"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"O Anatole von Lilienfeld","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0001-7419-0466","affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5088793872"],"corresponding_institution_ids":[],"apc_list":{"value":1600,"currency":"GBP","value_usd":1962},"apc_paid":{"value":1600,"currency":"GBP","value_usd":1962},"fwci":1.7918,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.88509858,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"5","issue":"2","first_page":"025058","last_page":"025058"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9430999755859375,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.6611498594284058},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5796913504600525},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5207234025001526},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5119917988777161},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4333122968673706},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.09621307253837585}],"concepts":[{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.6611498594284058},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5796913504600525},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5207234025001526},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5119917988777161},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4333122968673706},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.09621307253837585},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1088/2632-2153/ad4ae5","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ad4ae5","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},{"id":"pmh:oai:DiVA.org:uu-534289","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:uu:diva-534289","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article in journal"},{"id":"pmh:oai:doaj.org/article:0506d6d035634242bde078321393b2b8","is_oa":true,"landing_page_url":"https://doaj.org/article/0506d6d035634242bde078321393b2b8","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning: Science and Technology, Vol 5, Iss 2, p 025058 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1088/2632-2153/ad4ae5","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ad4ae5","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2827248422","display_name":"Quantum Machine Learning: Chemical Reactions with Unprecedented Speed and Accuracy","funder_award_id":"772834","funder_id":"https://openalex.org/F4320338335","funder_display_name":"H2020 European Research Council"},{"id":"https://openalex.org/G4626463381","display_name":null,"funder_award_id":"957189","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7010704880","display_name":null,"funder_award_id":"772834","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7842005466","display_name":null,"funder_award_id":"Horizon 2020","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320309949","display_name":"Canadian Institute for Advanced Research","ror":"https://ror.org/01sdtdd95"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320322015","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087"},{"id":"https://openalex.org/F4320322581","display_name":"Vetenskapsr\u00e5det","ror":"https://ror.org/03zttf063"},{"id":"https://openalex.org/F4320326644","display_name":"Canada First Research Excellence Fund","ror":null},{"id":"https://openalex.org/F4320338335","display_name":"H2020 European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W755588900","https://openalex.org/W1971044734","https://openalex.org/W1974667766","https://openalex.org/W1975147762","https://openalex.org/W1981368803","https://openalex.org/W1993077801","https://openalex.org/W1999638776","https://openalex.org/W2006787354","https://openalex.org/W2016280381","https://openalex.org/W2023271753","https://openalex.org/W2024801181","https://openalex.org/W2029125182","https://openalex.org/W2030971064","https://openalex.org/W2033206800","https://openalex.org/W2037223803","https://openalex.org/W2037761619","https://openalex.org/W2058363175","https://openalex.org/W2072750586","https://openalex.org/W2080635178","https://openalex.org/W2104489082","https://openalex.org/W2114704115","https://openalex.org/W2134429390","https://openalex.org/W2143981217","https://openalex.org/W2153693853","https://openalex.org/W2160540043","https://openalex.org/W2169678694","https://openalex.org/W2726670313","https://openalex.org/W2732698050","https://openalex.org/W2753962198","https://openalex.org/W2766033847","https://openalex.org/W2780173879","https://openalex.org/W2886916841","https://openalex.org/W2891365537","https://openalex.org/W2900483837","https://openalex.org/W2921706278","https://openalex.org/W2967510802","https://openalex.org/W2976102057","https://openalex.org/W2990015413","https://openalex.org/W2997591727","https://openalex.org/W3000291311","https://openalex.org/W3003486042","https://openalex.org/W3035559885","https://openalex.org/W3040330580","https://openalex.org/W3085090411","https://openalex.org/W3089029843","https://openalex.org/W3101744125","https://openalex.org/W3105379789","https://openalex.org/W3126679164","https://openalex.org/W3176448302","https://openalex.org/W3193988690","https://openalex.org/W3209046823","https://openalex.org/W4220694746","https://openalex.org/W4293575590","https://openalex.org/W4296031723","https://openalex.org/W4300537282","https://openalex.org/W4319162181","https://openalex.org/W4384154882","https://openalex.org/W4384627417","https://openalex.org/W4385264179","https://openalex.org/W4385849703","https://openalex.org/W6675354045","https://openalex.org/W6679844677","https://openalex.org/W6740515311","https://openalex.org/W6842461873","https://openalex.org/W6842871304"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Abstract":[0],"For":[1],"many":[2],"machine":[3,44,155],"learning":[4,45,156,250],"applications":[5],"in":[6,27,63,130,290],"science,":[7],"data":[8,36,50,62,75,160],"acquisition,":[9],"not":[10,278],"training,":[11],"is":[12,38],"the":[13,159,240,254,259,273,286,294],"bottleneck":[14],"even":[15],"when":[16,149,246],"avoiding":[17],"experiments":[18],"and":[19,23,26,32,92,111,113,121,147,209,251,267,272,289,301,317,329],"relying":[20],"on":[21,253,296,307],"computation":[22],"simulation.":[24],"Correspondingly,":[25],"order":[28,64],"to":[29,65,151,238,313],"reduce":[30],"cost":[31,138],"carbon":[33],"footprint,":[34],"training":[35,49,74],"efficiency":[37],"key.":[39],"We":[40],"introduce":[41],"minimal":[42],"multilevel":[43,154,249],"(M3L)":[46],"which":[47],"optimizes":[48],"set":[51],"sizes":[52],"using":[53,309],"a":[54,67],"loss":[55],"function":[56],"at":[57,100],"multiple":[58],"levels":[59,102,256,303],"of":[60,69,95,97,103,142,261],"reference":[61],"minimize":[66],"combination":[68,291],"prediction":[70],"error":[71],"with":[72,116,292],"overall":[73],"acquisition":[76],"costs":[77],"(as":[78],"measured":[79],"by":[80,140],"computational":[81,137],"wall-times).":[82],"Numerical":[83],"evidence":[84],"has":[85],"been":[86],"obtained":[87],"for":[88,126,158,242,304],"calculated":[89],"atomization":[90,305],"energies":[91,306],"electron":[93],"affinities":[94],"thousands":[96],"organic":[98],"molecules":[99,274],"various":[101],"theory":[104],"including":[105],"HF,":[106],"MP2,":[107],"DLPNO-CCSD(T),":[108],"DFHFCABS,":[109],"PNOMP2F12,":[110],"PNOCCSD(T)F12,":[112],"treating":[114],"them":[115],"basis":[117],"sets":[118,161],"TZ,":[119],"cc-pVTZ,":[120],"AVTZ-F12.":[122],"Our":[123],"M3L":[124,310],"benchmarks":[125],"reaching":[127],"chemical":[128,132],"accuracy":[129],"distinct":[131],"compound":[133],"sub-spaces":[134],"indicate":[135],"substantial":[136],"reductions":[139],"factors":[141],"\u223c1.01,":[143],"1.1,":[144],"3.8,":[145],"13.8,":[146],"25.8":[148],"compared":[150],"heuristic":[152],"sub-optimal":[153],"(M2L)":[157],"QM7b,":[162],"QM9":[163,186,210,308],"<mml:math":[164,187,211,321],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[165,188,212,322],"overflow=\"scroll\">":[166,189,213,323],"<mml:mrow>":[167,170,190,193,196,214,217,220,324],"<mml:msup>":[168],"<mml:mi/>":[169,192,216],"<mml:mi>LCCSD</mml:mi>":[171],"<mml:mo":[172,176,198,202,222,226],"stretchy=\"false\">(</mml:mo>":[173,199,223],"<mml:mi":[174,200,224],"mathvariant=\"normal\">T</mml:mi>":[175,201,225],"stretchy=\"false\">)</mml:mo>":[177,203,227],"</mml:mrow>":[178,180,195,204,206,219,228,230,326],"</mml:msup>":[179],"</mml:math>":[181,207,231,327],",":[182,208,232],"Electrolyte":[183],"Genome":[184],"Project,":[185],"<mml:msubsup>":[191,215],"<mml:mi>AE</mml:mi>":[194],"<mml:mi>CCSD</mml:mi>":[197,221],"</mml:msubsup>":[205,229],"<mml:mi>EA</mml:mi>":[218],"respectively.":[233],"Furthermore,":[234],"we":[235],"use":[236],"M2L":[237,271],"investigate":[239],"performance":[241],"76":[243],"density":[244],"functionals":[245,287],"used":[247],"within":[248],"building":[252],"following":[255],"drawn":[257],"from":[258],"hierarchy":[260],"Jacobs":[262],"Ladder:":[263],"LDA,":[264,293],"GGA,":[265],"mGGA,":[266],"hybrid":[268],"functionals.":[269],"Within":[270],"considered,":[275],"mGGAs":[276],"do":[277],"provide":[279],"any":[280],"noticeable":[281],"advantage":[282],"over":[283],"GGAs.":[284],"Among":[285],"considered":[288],"three":[295],"average":[297],"top":[298],"performing":[299],"GGA":[300],"Hybrid":[302],"correspond":[311],"respectively":[312],"PW91,":[314],"KT2,":[315],"B97D,":[316],"\u03c4":[318],"-HCTH,":[319],"B3LYP":[320],"<mml:mo>\u2217</mml:mo>":[325],"(VWN5),":[328],"TPSSH.":[330]},"counts_by_year":[{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
