{"id":"https://openalex.org/W2925920795","doi":"https://doi.org/10.3390/make1010032","title":"Evaluation of Regression Models: Model Assessment, Model Selection and Generalization Error","display_name":"Evaluation of Regression Models: Model Assessment, Model Selection and Generalization Error","publication_year":2019,"publication_date":"2019-03-22","ids":{"openalex":"https://openalex.org/W2925920795","doi":"https://doi.org/10.3390/make1010032","mag":"2925920795"},"language":"en","primary_location":{"id":"doi:10.3390/make1010032","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make1010032","pdf_url":"https://www.mdpi.com/2504-4990/1/1/32/pdf?version=1553678296","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2504-4990/1/1/32/pdf?version=1553678296","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057625030","display_name":"Frank Emmert\u2010Streib","orcid":"https://orcid.org/0000-0003-0745-5641"},"institutions":[{"id":"https://openalex.org/I166825849","display_name":"Tampere University","ror":"https://ror.org/033003e23","country_code":"FI","type":"education","lineage":["https://openalex.org/I166825849"]}],"countries":["FI"],"is_corresponding":true,"raw_author_name":"Frank Emmert-Streib","raw_affiliation_strings":["Institute of Biosciences and Medical Technology, 33520 Tampere, Finland","Predictive Society and Data Analytics Lab, Faculty of Information Technolgy and Communication Sciences, Tampere University, 33100 Tampere, Finland"],"raw_orcid":"https://orcid.org/0000-0003-0745-5641","affiliations":[{"raw_affiliation_string":"Institute of Biosciences and Medical Technology, 33520 Tampere, Finland","institution_ids":[]},{"raw_affiliation_string":"Predictive Society and Data Analytics Lab, Faculty of Information Technolgy and Communication Sciences, Tampere University, 33100 Tampere, Finland","institution_ids":["https://openalex.org/I166825849"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044244385","display_name":"Matthias Dehmer","orcid":"https://orcid.org/0000-0001-8454-5857"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]},{"id":"https://openalex.org/I4210114246","display_name":"UMIT - Private Universit\u00e4t f\u00fcr Gesundheitswissenschaften, Medizinische Informatik und Technik","ror":"https://ror.org/02d0kps43","country_code":"AT","type":"education","lineage":["https://openalex.org/I4210114246"]},{"id":"https://openalex.org/I4210136249","display_name":"University of Applied Sciences Upper Austria","ror":"https://ror.org/03jqp6d56","country_code":"AT","type":"education","lineage":["https://openalex.org/I4210136249"]}],"countries":["AT","CN"],"is_corresponding":false,"raw_author_name":"Matthias Dehmer","raw_affiliation_strings":["College of Computer and Control Engineering, Nankai University, Tianjin 300071, China","Department of Mechatronics and Biomedical Computer Science, University for Health Sciences, Medical Informatics and Technology, 6060 Hall in Tirol, Austria","Institute for Intelligent Production, Faculty for Management, University of Applied Sciences Upper Austria, Steyr Campus, 4400 Steyr, Austria"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer and Control Engineering, Nankai University, Tianjin 300071, China","institution_ids":["https://openalex.org/I205237279"]},{"raw_affiliation_string":"Department of Mechatronics and Biomedical Computer Science, University for Health Sciences, Medical Informatics and Technology, 6060 Hall in Tirol, Austria","institution_ids":["https://openalex.org/I4210114246"]},{"raw_affiliation_string":"Institute for Intelligent Production, Faculty for Management, University of Applied Sciences Upper Austria, Steyr Campus, 4400 Steyr, Austria","institution_ids":["https://openalex.org/I4210136249"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5057625030"],"corresponding_institution_ids":["https://openalex.org/I166825849"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":6.9685,"has_fulltext":true,"cited_by_count":125,"citation_normalized_percentile":{"value":0.97462088,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"1","issue":"1","first_page":"521","last_page":"551"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13398","display_name":"Data Analysis with R","score":0.9790999889373779,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11871","display_name":"Advanced Statistical Methods and Models","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.9180965423583984},{"id":"https://openalex.org/keywords/model-selection","display_name":"Model selection","score":0.7436697483062744},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7193936109542847},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6208770871162415},{"id":"https://openalex.org/keywords/resampling","display_name":"Resampling","score":0.6072017550468445},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5857415795326233},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5606794953346252},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5468674302101135},{"id":"https://openalex.org/keywords/statistical-model","display_name":"Statistical model","score":0.5251184105873108},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.45126205682754517},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.44819629192352295},{"id":"https://openalex.org/keywords/linear-model","display_name":"Linear model","score":0.44181811809539795},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.4362232983112335},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.41495534777641296},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.22368329763412476},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22073131799697876},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.14867982268333435}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.9180965423583984},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.7436697483062744},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7193936109542847},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6208770871162415},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.6072017550468445},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5857415795326233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5606794953346252},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5468674302101135},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.5251184105873108},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.45126205682754517},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.44819629192352295},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.44181811809539795},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.4362232983112335},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.41495534777641296},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.22368329763412476},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22073131799697876},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.14867982268333435},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/make1010032","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make1010032","pdf_url":"https://www.mdpi.com/2504-4990/1/1/32/pdf?version=1553678296","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},{"id":"pmh:oai:mdpi.com:/2504-4990/1/1/32/","is_oa":true,"landing_page_url":"http://dx.doi.org/10.3390/make1010032","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"Text"},{"id":"pmh:oai:trepo.tuni.fi:10024/215779","is_oa":true,"landing_page_url":"https://trepo.tuni.fi/handle/10024/215779","pdf_url":null,"source":{"id":"https://openalex.org/S7407055260","display_name":"Trepo - Institutional Repository of Tampere University","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/make1010032","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make1010032","pdf_url":"https://www.mdpi.com/2504-4990/1/1/32/pdf?version=1553678296","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2925920795.pdf","grobid_xml":"https://content.openalex.org/works/W2925920795.grobid-xml"},"referenced_works_count":87,"referenced_works":["https://openalex.org/W197379496","https://openalex.org/W369767410","https://openalex.org/W601070381","https://openalex.org/W1001370459","https://openalex.org/W1468645148","https://openalex.org/W1509562192","https://openalex.org/W1516193414","https://openalex.org/W1523985187","https://openalex.org/W1554944419","https://openalex.org/W1560724230","https://openalex.org/W1577349312","https://openalex.org/W1726463755","https://openalex.org/W1824067107","https://openalex.org/W1840091437","https://openalex.org/W1877880381","https://openalex.org/W1940174779","https://openalex.org/W1966827292","https://openalex.org/W1975032412","https://openalex.org/W1981251392","https://openalex.org/W1981525111","https://openalex.org/W1981552604","https://openalex.org/W1983755491","https://openalex.org/W1995945562","https://openalex.org/W2013805643","https://openalex.org/W2019448438","https://openalex.org/W2019880039","https://openalex.org/W2020925091","https://openalex.org/W2029084939","https://openalex.org/W2047028564","https://openalex.org/W2052779929","https://openalex.org/W2054282473","https://openalex.org/W2058839892","https://openalex.org/W2070907364","https://openalex.org/W2076118331","https://openalex.org/W2076684951","https://openalex.org/W2085890860","https://openalex.org/W2087414659","https://openalex.org/W2089763487","https://openalex.org/W2099385862","https://openalex.org/W2103903744","https://openalex.org/W2104676838","https://openalex.org/W2105981176","https://openalex.org/W2109844396","https://openalex.org/W2112081648","https://openalex.org/W2115643478","https://openalex.org/W2115709314","https://openalex.org/W2118649542","https://openalex.org/W2120906154","https://openalex.org/W2122825543","https://openalex.org/W2124181495","https://openalex.org/W2131842864","https://openalex.org/W2135046866","https://openalex.org/W2140875296","https://openalex.org/W2141975087","https://openalex.org/W2144935164","https://openalex.org/W2148807518","https://openalex.org/W2150209433","https://openalex.org/W2154290668","https://openalex.org/W2154776925","https://openalex.org/W2158196600","https://openalex.org/W2159397589","https://openalex.org/W2168175751","https://openalex.org/W2187180375","https://openalex.org/W2294962740","https://openalex.org/W2300879143","https://openalex.org/W2798641619","https://openalex.org/W2888056875","https://openalex.org/W2891113190","https://openalex.org/W2897173776","https://openalex.org/W2905506148","https://openalex.org/W2910575305","https://openalex.org/W3002782274","https://openalex.org/W3104887532","https://openalex.org/W3144545015","https://openalex.org/W3175417087","https://openalex.org/W4211177544","https://openalex.org/W4212883601","https://openalex.org/W4234698323","https://openalex.org/W4256183008","https://openalex.org/W4299551239","https://openalex.org/W4379510236","https://openalex.org/W4399582985","https://openalex.org/W6608024681","https://openalex.org/W6638983183","https://openalex.org/W6680701566","https://openalex.org/W6682981795","https://openalex.org/W6902656498"],"related_works":["https://openalex.org/W4362597605","https://openalex.org/W4225271882","https://openalex.org/W2003394143","https://openalex.org/W2109007220","https://openalex.org/W1607827294","https://openalex.org/W2895680438","https://openalex.org/W4221149483","https://openalex.org/W2611757366","https://openalex.org/W1980211030","https://openalex.org/W2053546922"],"abstract_inverted_index":{"When":[0],"performing":[1],"a":[2,11,26,40],"regression":[3,124],"or":[4],"classification":[5,139],"analysis,":[6],"one":[7,42],"needs":[8,43],"to":[9,37,44,48,132],"specify":[10],"statistical":[12,83],"model.":[13],"This":[14],"model":[15,47,52,67,70,95],"should":[16],"avoid":[17],"the":[18,63,75,100,114],"overfitting":[19],"and":[20,24,69,78,91,103],"underfitting":[21],"of":[22,66],"data,":[23],"achieve":[25],"low":[27],"generalization":[28],"error":[29],"that":[30],"characterizes":[31],"its":[32],"prediction":[33],"performance.":[34],"In":[35,58],"order":[36],"identify":[38],"such":[39],"model,":[41],"decide":[45],"which":[46],"select":[49],"from":[50],"candidate":[51],"families":[53],"based":[54],"on":[55],"performance":[56],"evaluations.":[57],"this":[59],"paper,":[60],"we":[61,118],"review":[62],"theoretical":[64,115],"framework":[65],"selection":[68,89],"assessment,":[71],"including":[72],"error-complexity":[73],"curves,":[74],"bias-variance":[76],"tradeoff,":[77],"learning":[79],"curves":[80],"for":[81,94,106,122],"evaluating":[82],"models.":[84,125],"We":[85],"discuss":[86],"criterion-based,":[87],"step-wise":[88],"procedures":[90],"resampling":[92],"methods":[93],"selection,":[96],"whereas":[97],"cross-validation":[98],"provides":[99],"most":[101],"simple":[102],"generic":[104],"means":[105],"computationally":[107],"estimating":[108],"all":[109],"required":[110],"entities.":[111],"To":[112],"make":[113],"concepts":[116],"transparent,":[117],"present":[119],"worked":[120],"examples":[121],"linear":[123],"However,":[126],"our":[127],"conceptual":[128],"presentation":[129],"is":[130],"extensible":[131],"more":[133],"general":[134],"models,":[135],"as":[136,138],"well":[137],"problems.":[140]},"counts_by_year":[{"year":2026,"cited_by_count":16},{"year":2025,"cited_by_count":24},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":18},{"year":2022,"cited_by_count":24},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":5}],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2025-10-10T00:00:00"}
