{"id":"https://openalex.org/W4405853974","doi":"https://doi.org/10.1007/s41019-024-00270-x","title":"Improving Generalization of Genetic Programming for High-Dimensional Symbolic Regression with Shapley Value Based Feature Selection","display_name":"Improving Generalization of Genetic Programming for High-Dimensional Symbolic Regression with Shapley Value Based Feature Selection","publication_year":2024,"publication_date":"2024-12-28","ids":{"openalex":"https://openalex.org/W4405853974","doi":"https://doi.org/10.1007/s41019-024-00270-x"},"language":"en","primary_location":{"id":"doi:10.1007/s41019-024-00270-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41019-024-00270-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41019-024-00270-x.pdf","source":{"id":"https://openalex.org/S2486411021","display_name":"Data Science and Engineering","issn_l":"2364-1185","issn":["2364-1185","2364-1541"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://link.springer.com/content/pdf/10.1007/s41019-024-00270-x.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101811467","display_name":"Chunyu Wang","orcid":"https://orcid.org/0000-0003-1688-2944"},"institutions":[{"id":"https://openalex.org/I41156924","display_name":"Victoria University of Wellington","ror":"https://ror.org/0040r6f76","country_code":"NZ","type":"education","lineage":["https://openalex.org/I41156924"]}],"countries":["NZ"],"is_corresponding":true,"raw_author_name":"Chunyu Wang","raw_affiliation_strings":["Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand"],"affiliations":[{"raw_affiliation_string":"Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand","institution_ids":["https://openalex.org/I41156924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100340143","display_name":"Qi Chen","orcid":"https://orcid.org/0000-0001-9367-4757"},"institutions":[{"id":"https://openalex.org/I41156924","display_name":"Victoria University of Wellington","ror":"https://ror.org/0040r6f76","country_code":"NZ","type":"education","lineage":["https://openalex.org/I41156924"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Qi Chen","raw_affiliation_strings":["Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand"],"affiliations":[{"raw_affiliation_string":"Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand","institution_ids":["https://openalex.org/I41156924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080779869","display_name":"Bing Xue","orcid":"https://orcid.org/0000-0002-7790-1216"},"institutions":[{"id":"https://openalex.org/I41156924","display_name":"Victoria University of Wellington","ror":"https://ror.org/0040r6f76","country_code":"NZ","type":"education","lineage":["https://openalex.org/I41156924"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Bing Xue","raw_affiliation_strings":["Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand"],"affiliations":[{"raw_affiliation_string":"Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand","institution_ids":["https://openalex.org/I41156924"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100400258","display_name":"Mengjie Zhang","orcid":"https://orcid.org/0000-0003-4463-9538"},"institutions":[{"id":"https://openalex.org/I41156924","display_name":"Victoria University of Wellington","ror":"https://ror.org/0040r6f76","country_code":"NZ","type":"education","lineage":["https://openalex.org/I41156924"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Mengjie Zhang","raw_affiliation_strings":["Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand"],"affiliations":[{"raw_affiliation_string":"Centre for Data Science and Artificial Intelligence & School of Engineering and Computer Science, Victoria University of Wellington, Wellington, 6140, New Zealand","institution_ids":["https://openalex.org/I41156924"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101811467"],"corresponding_institution_ids":["https://openalex.org/I41156924"],"apc_list":null,"apc_paid":null,"fwci":2.044,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.89247769,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"10","issue":"2","first_page":"196","last_page":"211"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9800999760627747,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/symbolic-regression","display_name":"Symbolic regression","score":0.8063240051269531},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7927671074867249},{"id":"https://openalex.org/keywords/genetic-programming","display_name":"Genetic programming","score":0.7825295925140381},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7652400732040405},{"id":"https://openalex.org/keywords/shapley-value","display_name":"Shapley value","score":0.715056300163269},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.6901602745056152},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6569263339042664},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.6315785646438599},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.578486979007721},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.46972501277923584},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4627079963684082},{"id":"https://openalex.org/keywords/genetic-algorithm","display_name":"Genetic algorithm","score":0.4528173506259918},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4008169174194336},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3432580828666687},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3200865685939789},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.2357260286808014},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.17743778228759766},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1574244201183319},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.1281191110610962}],"concepts":[{"id":"https://openalex.org/C2776400721","wikidata":"https://www.wikidata.org/wiki/Q18171762","display_name":"Symbolic regression","level":3,"score":0.8063240051269531},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7927671074867249},{"id":"https://openalex.org/C110332635","wikidata":"https://www.wikidata.org/wiki/Q629498","display_name":"Genetic programming","level":2,"score":0.7825295925140381},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7652400732040405},{"id":"https://openalex.org/C199022921","wikidata":"https://www.wikidata.org/wiki/Q240046","display_name":"Shapley value","level":3,"score":0.715056300163269},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.6901602745056152},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6569263339042664},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.6315785646438599},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.578486979007721},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.46972501277923584},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4627079963684082},{"id":"https://openalex.org/C8880873","wikidata":"https://www.wikidata.org/wiki/Q187787","display_name":"Genetic algorithm","level":2,"score":0.4528173506259918},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4008169174194336},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3432580828666687},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3200865685939789},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.2357260286808014},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.17743778228759766},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1574244201183319},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.1281191110610962},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s41019-024-00270-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41019-024-00270-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41019-024-00270-x.pdf","source":{"id":"https://openalex.org/S2486411021","display_name":"Data Science and Engineering","issn_l":"2364-1185","issn":["2364-1185","2364-1541"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science and Engineering","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:10b0456ddcce42118116792fc7a9424b","is_oa":true,"landing_page_url":"https://doaj.org/article/10b0456ddcce42118116792fc7a9424b","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Data Science and Engineering, Vol 10, Iss 2, Pp 196-211 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s41019-024-00270-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s41019-024-00270-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s41019-024-00270-x.pdf","source":{"id":"https://openalex.org/S2486411021","display_name":"Data Science and Engineering","issn_l":"2364-1185","issn":["2364-1185","2364-1541"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Science and Engineering","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"No poverty","id":"https://metadata.un.org/sdg/1","score":0.5899999737739563}],"awards":[{"id":"https://openalex.org/G1259549522","display_name":null,"funder_award_id":"VUW1914","funder_id":"https://openalex.org/F4320335369","funder_display_name":"Marsden Fund"},{"id":"https://openalex.org/G2104203407","display_name":null,"funder_award_id":"VUW2016","funder_id":"https://openalex.org/F4320316156","funder_display_name":"New Zealand Government"},{"id":"https://openalex.org/G5000515651","display_name":null,"funder_award_id":"VUW1913","funder_id":"https://openalex.org/F4320316156","funder_display_name":"New Zealand Government"},{"id":"https://openalex.org/G5426661128","display_name":null,"funder_award_id":"VUW1913","funder_id":"https://openalex.org/F4320335369","funder_display_name":"Marsden Fund"},{"id":"https://openalex.org/G6083011409","display_name":null,"funder_award_id":"VUW2016","funder_id":"https://openalex.org/F4320335369","funder_display_name":"Marsden Fund"},{"id":"https://openalex.org/G6908269673","display_name":null,"funder_award_id":"VUW1914","funder_id":"https://openalex.org/F4320316156","funder_display_name":"New Zealand Government"}],"funders":[{"id":"https://openalex.org/F4320316156","display_name":"New Zealand Government","ror":"https://ror.org/04v3jxv31"},{"id":"https://openalex.org/F4320329501","display_name":"Serono Symposia International Foundation","ror":null},{"id":"https://openalex.org/F4320335369","display_name":"Marsden Fund","ror":null}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4405853974.pdf"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W1519072852","https://openalex.org/W2025131201","https://openalex.org/W2040492000","https://openalex.org/W2129888542","https://openalex.org/W2132862423","https://openalex.org/W2343420905","https://openalex.org/W2556301080","https://openalex.org/W2558896678","https://openalex.org/W2595303237","https://openalex.org/W2734114384","https://openalex.org/W2889259518","https://openalex.org/W2973941913","https://openalex.org/W2982960219","https://openalex.org/W2999911359","https://openalex.org/W3016401366","https://openalex.org/W3042621157","https://openalex.org/W3080395176","https://openalex.org/W3120671187","https://openalex.org/W3206431085","https://openalex.org/W4387011164","https://openalex.org/W4389312652","https://openalex.org/W4392523547","https://openalex.org/W6944942256","https://openalex.org/W6945313366"],"related_works":["https://openalex.org/W2968285896","https://openalex.org/W2381504162","https://openalex.org/W1567571923","https://openalex.org/W2472646430","https://openalex.org/W2610450612","https://openalex.org/W2549153708","https://openalex.org/W1964607451","https://openalex.org/W2897801744","https://openalex.org/W2147355282","https://openalex.org/W2394133867"],"abstract_inverted_index":{"Abstract":[0],"Symbolic":[1],"Regression":[2],"(SR)":[3],"on":[4,126,153,167],"high-dimensional":[5,40,118,128],"datasets":[6],"often":[7],"encounters":[8],"significant":[9],"challenges,":[10],"resulting":[11],"in":[12,31,35,115,146],"models":[13],"with":[14],"poor":[15],"generalization":[16,27,151],"capabilities.":[17],"While":[18],"feature":[19,57,83,102,143],"selection":[20,103,144],"has":[21],"the":[22,26,50,63,85,106,131,168],"potential":[23],"to":[24,55,92,109],"enhance":[25],"and":[28,69,111,140,150],"learning":[29,149],"performance":[30,152],"general,":[32],"its":[33],"application":[34],"Genetic":[36],"Programming":[37],"(GP)":[38],"for":[39,117],"SR":[41],"remains":[42],"a":[43,66,70,89,100,121],"complex":[44],"problem.":[45],"Originating":[46],"from":[47],"game":[48],"theory,":[49],"Shapley":[51,86,107],"value":[52,87,108],"is":[53],"applied":[54],"additive":[56],"attribution":[58],"approaches":[59],"where":[60],"it":[61],"distributes":[62],"difference":[64],"between":[65],"model":[67],"output":[68],"baseline":[71],"average":[72],"across":[73],"input":[74],"variables.":[75],"By":[76],"providing":[77],"an":[78],"accurate":[79],"assessment":[80],"of":[81,123,148,170],"each":[82],"importance,":[84],"offers":[88],"robust":[90],"approach":[91],"select":[93,112],"features.":[94,172],"In":[95],"this":[96],"paper,":[97],"we":[98],"propose":[99],"novel":[101],"method":[104],"leveraging":[105],"identify":[110],"important":[113,171],"features":[114],"GP":[116,139],"SR.":[119],"Through":[120],"series":[122],"experiments":[124],"conducted":[125],"ten":[127],"regression":[129],"datasets,":[130],"results":[132],"indicate":[133],"that":[134,159],"our":[135,160],"algorithm":[136,161],"surpasses":[137],"standard":[138],"other":[141],"GP-based":[142],"methods":[145],"terms":[147],"most":[154],"datasets.":[155],"Further":[156],"analysis":[157],"reveals":[158],"generates":[162],"more":[163],"compact":[164],"models,":[165],"focusing":[166],"inclusion":[169]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":4}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
