{"id":"https://openalex.org/W3115199521","doi":"https://doi.org/10.1088/2632-2153/abfe7c","title":"Improving sample and feature selection with principal covariates regression","display_name":"Improving sample and feature selection with principal covariates regression","publication_year":2021,"publication_date":"2021-05-06","ids":{"openalex":"https://openalex.org/W3115199521","doi":"https://doi.org/10.1088/2632-2153/abfe7c","mag":"3115199521"},"language":"en","primary_location":{"id":"doi:10.1088/2632-2153/abfe7c","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/abfe7c","pdf_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abfe7c/pdf","source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abfe7c/pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067642969","display_name":"Rose K. Cersonsky","orcid":"https://orcid.org/0000-0003-4515-3441"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Rose K Cersonsky","raw_affiliation_strings":["Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0003-4515-3441","affiliations":[{"raw_affiliation_string":"Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059459283","display_name":"Benjamin A. Helfrecht","orcid":null},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Benjamin A Helfrecht","raw_affiliation_strings":["Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-2260-7183","affiliations":[{"raw_affiliation_string":"Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042465133","display_name":"Edgar A. Engel","orcid":"https://orcid.org/0000-0003-2944-9445"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Edgar A Engel","raw_affiliation_strings":["TCM Group, Cavendish Laboratory, University of Cambridge, J.J. Thomson Avenue, Cambridge CB3 0HE, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0003-2944-9445","affiliations":[{"raw_affiliation_string":"TCM Group, Cavendish Laboratory, University of Cambridge, J.J. Thomson Avenue, Cambridge CB3 0HE, United Kingdom","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Sergei Kliavinek","orcid":"https://orcid.org/0000-0001-8326-325X"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Sergei Kliavinek","raw_affiliation_strings":["Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0001-8326-325X","affiliations":[{"raw_affiliation_string":"Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"last","author":{"id":null,"display_name":"Michele Ceriotti","orcid":"https://orcid.org/0000-0003-2571-2832"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Michele Ceriotti","raw_affiliation_strings":["Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0003-2571-2832","affiliations":[{"raw_affiliation_string":"Laboratory of Computational Science and Modeling, IMX, \u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, 1015 Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5067642969"],"corresponding_institution_ids":["https://openalex.org/I5124864"],"apc_list":{"value":1600,"currency":"GBP","value_usd":1962},"apc_paid":{"value":1600,"currency":"GBP","value_usd":1962},"fwci":0.3203,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.47687503,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"2","issue":"3","first_page":"035038","last_page":"035038"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10640","display_name":"Spectroscopy and Chemometric Analyses","score":0.9851999878883362,"subfield":{"id":"https://openalex.org/subfields/1602","display_name":"Analytical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7003054618835449},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6511085629463196},{"id":"https://openalex.org/keywords/principal-component-regression","display_name":"Principal component regression","score":0.6456552743911743},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.6267426013946533},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.5987606644630432},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.592434287071228},{"id":"https://openalex.org/keywords/covariate","display_name":"Covariate","score":0.5425409078598022},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5330326557159424},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5256907939910889},{"id":"https://openalex.org/keywords/elastic-net-regularization","display_name":"Elastic net regularization","score":0.47194188833236694},{"id":"https://openalex.org/keywords/kernel-regression","display_name":"Kernel regression","score":0.43932846188545227},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.42661362886428833},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.41619428992271423},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.4102945029735565},{"id":"https://openalex.org/keywords/principal-component-analysis","display_name":"Principal component analysis","score":0.3954002261161804},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39150702953338623},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.32440972328186035},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.20890632271766663},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17553558945655823}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7003054618835449},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6511085629463196},{"id":"https://openalex.org/C74887250","wikidata":"https://www.wikidata.org/wiki/Q3455892","display_name":"Principal component regression","level":3,"score":0.6456552743911743},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.6267426013946533},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.5987606644630432},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.592434287071228},{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.5425409078598022},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5330326557159424},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5256907939910889},{"id":"https://openalex.org/C203868755","wikidata":"https://www.wikidata.org/wiki/Q5353562","display_name":"Elastic net regularization","level":3,"score":0.47194188833236694},{"id":"https://openalex.org/C200695384","wikidata":"https://www.wikidata.org/wiki/Q1739319","display_name":"Kernel regression","level":3,"score":0.43932846188545227},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.42661362886428833},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.41619428992271423},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.4102945029735565},{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.3954002261161804},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39150702953338623},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.32440972328186035},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.20890632271766663},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17553558945655823},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":9,"locations":[{"id":"doi:10.1088/2632-2153/abfe7c","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/abfe7c","pdf_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abfe7c/pdf","source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2012.12253","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2012.12253","pdf_url":"https://arxiv.org/pdf/2012.12253","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3115199521","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2012.12253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:infoscience.epfl.ch:287519","is_oa":true,"landing_page_url":"http://infoscience.epfl.ch/record/287519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"research article"},{"id":"pmh:oai:www.repository.cam.ac.uk:1810/325566","is_oa":true,"landing_page_url":"https://www.repository.cam.ac.uk/handle/1810/325566","pdf_url":null,"source":{"id":"https://openalex.org/S4306401777","display_name":"Apollo (University of Cambridge)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I241749","host_organization_name":"University of Cambridge","host_organization_lineage":["https://openalex.org/I241749"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"},{"id":"pmh:oai:www.repository.cam.ac.uk:1810/325568","is_oa":true,"landing_page_url":"https://www.repository.cam.ac.uk/handle/1810/325568","pdf_url":null,"source":{"id":"https://openalex.org/S4306401777","display_name":"Apollo (University of Cambridge)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I241749","host_organization_name":"University of Cambridge","host_organization_lineage":["https://openalex.org/I241749"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2012.12253","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2012.12253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"doi:10.17863/cam.73023","is_oa":true,"landing_page_url":"https://doi.org/10.17863/cam.73023","pdf_url":null,"source":{"id":"https://openalex.org/S7407050737","display_name":"Apollo","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"},{"id":"doi:10.17863/cam.73025","is_oa":true,"landing_page_url":"https://doi.org/10.17863/cam.73025","pdf_url":null,"source":{"id":"https://openalex.org/S7407050737","display_name":"Apollo","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"doi:10.1088/2632-2153/abfe7c","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/abfe7c","pdf_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abfe7c/pdf","source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.6899999976158142,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G813359770","display_name":null,"funder_award_id":"677013-HBMAP","funder_id":"https://openalex.org/F4320338335","funder_display_name":"H2020 European Research Council"}],"funders":[{"id":"https://openalex.org/F4320334670","display_name":"Trinity College, University of Cambridge","ror":null},{"id":"https://openalex.org/F4320338335","display_name":"H2020 European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3115199521.pdf","grobid_xml":"https://content.openalex.org/works/W3115199521.grobid-xml"},"referenced_works_count":63,"referenced_works":["https://openalex.org/W1488808450","https://openalex.org/W1602011302","https://openalex.org/W1756006159","https://openalex.org/W1773151392","https://openalex.org/W1975997599","https://openalex.org/W1994410331","https://openalex.org/W1999501864","https://openalex.org/W2010237043","https://openalex.org/W2010464263","https://openalex.org/W2017447741","https://openalex.org/W2017641901","https://openalex.org/W2018244852","https://openalex.org/W2025444507","https://openalex.org/W2029413789","https://openalex.org/W2030363461","https://openalex.org/W2032784723","https://openalex.org/W2040775130","https://openalex.org/W2040884411","https://openalex.org/W2042640655","https://openalex.org/W2051752778","https://openalex.org/W2053962240","https://openalex.org/W2058370262","https://openalex.org/W2063907334","https://openalex.org/W2075529349","https://openalex.org/W2078841894","https://openalex.org/W2083415705","https://openalex.org/W2085831731","https://openalex.org/W2091903645","https://openalex.org/W2098502158","https://openalex.org/W2104489082","https://openalex.org/W2107808739","https://openalex.org/W2131987814","https://openalex.org/W2135595031","https://openalex.org/W2141696759","https://openalex.org/W2143426320","https://openalex.org/W2147988069","https://openalex.org/W2261059368","https://openalex.org/W2276944336","https://openalex.org/W2563408008","https://openalex.org/W2593436234","https://openalex.org/W2620687153","https://openalex.org/W2624385633","https://openalex.org/W2740586183","https://openalex.org/W2784499877","https://openalex.org/W2795523124","https://openalex.org/W2800392236","https://openalex.org/W2805461540","https://openalex.org/W2885194867","https://openalex.org/W2892094491","https://openalex.org/W2900475422","https://openalex.org/W2979598191","https://openalex.org/W3000291311","https://openalex.org/W3033175727","https://openalex.org/W3041909131","https://openalex.org/W3045624638","https://openalex.org/W3119530000","https://openalex.org/W3126083771","https://openalex.org/W4289236186","https://openalex.org/W6600700788","https://openalex.org/W6630862228","https://openalex.org/W6791133293","https://openalex.org/W6893814717","https://openalex.org/W6926310564"],"related_works":["https://openalex.org/W2773081693","https://openalex.org/W2883670420","https://openalex.org/W2213053788","https://openalex.org/W22781849","https://openalex.org/W2149476927","https://openalex.org/W3011932872","https://openalex.org/W3124484778","https://openalex.org/W2897897432","https://openalex.org/W2963214869","https://openalex.org/W1525811561","https://openalex.org/W2900374106","https://openalex.org/W2884898416","https://openalex.org/W2588246945","https://openalex.org/W2520964493","https://openalex.org/W3183081247","https://openalex.org/W1510567447","https://openalex.org/W1728010878","https://openalex.org/W3133924939","https://openalex.org/W3098154559","https://openalex.org/W2963211851"],"abstract_inverted_index":{"Abstract":[0],"Selecting":[1],"the":[2,23,32,37,62,73,77,94,98,141,152,175],"most":[3,78],"relevant":[4],"features":[5,178],"and":[6,35,65,81,130,158,165,179],"samples":[7,80,180],"out":[8],"of":[9,13,25,39,61,76,120,143,173,177,187],"a":[10,16,40,58,90,171,184],"large":[11],"set":[12],"candidates":[14],"is":[15],"task":[17],"that":[18,111],"occurs":[19],"very":[20],"often":[21,36],"in":[22,109,114],"context":[24],"automated":[26],"data":[27],"analysis,":[28],"where":[29],"it":[30],"improves":[31],"computational":[33],"performance":[34],"transferability":[38],"model.":[41],"Here":[42],"we":[43],"focus":[44],"on":[45,72],"two":[46,174],"popular":[47],"subselection":[48,145],"schemes":[49],"applied":[50],"to":[51,126,139,163,182],"this":[52,107],"end:":[53],"CUR":[54],"decomposition,":[55],"derived":[56],"from":[57,123],"low-rank":[59],"approximation":[60],"feature":[63],"matrix,":[64],"farthest":[66],"point":[67],"sampling":[68],"(FPS),":[69],"which":[70],"relies":[71],"iterative":[74],"identification":[75],"diverse":[79],"discriminating":[82],"features.":[83],"We":[84,104,135,150],"modify":[85],"these":[86],"unsupervised":[87,148],"approaches,":[88],"incorporating":[89],"supervised":[91,115],"component":[92],"following":[93],"same":[95],"spirit":[96],"as":[97],"principal":[99],"covariates":[100],"(PCov)":[101],"regression":[102,125,129,188],"method.":[103],"show":[105],"how":[106],"results":[108],"selections":[110,160],"perform":[112],"better":[113],"tasks,":[116],"demonstrating":[117],"with":[118,156],"models":[119],"increasing":[121],"complexity,":[122],"ridge":[124,128],"kernel":[127],"finally":[131],"feed-forward":[132],"neural":[133],"networks.":[134],"also":[136],"present":[137],"adjustments":[138],"minimise":[140],"impact":[142],"any":[144],"when":[146],"performing":[147],"tasks.":[149],"demonstrate":[151],"significant":[153],"improvements":[154],"associated":[155],"PCov-CUR":[157],"PCov-FPS":[159],"for":[161],"applications":[162],"chemistry":[164],"materials":[166],"science,":[167],"typically":[168],"reducing":[169],"by":[170],"factor":[172],"number":[176],"required":[181],"achieve":[183],"given":[185],"level":[186],"accuracy.":[189]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
