{"id":"https://openalex.org/W4407619039","doi":"https://doi.org/10.1186/s40537-025-01071-3","title":"Enhancing the performance of gradient boosting trees on regression problems","display_name":"Enhancing the performance of gradient boosting trees on regression problems","publication_year":2025,"publication_date":"2025-02-17","ids":{"openalex":"https://openalex.org/W4407619039","doi":"https://doi.org/10.1186/s40537-025-01071-3"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-025-01071-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01071-3","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-025-01071-3","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-025-01071-3","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070534741","display_name":"Lydia Wahid Rizkallah","orcid":"https://orcid.org/0000-0002-8243-2135"},"institutions":[{"id":"https://openalex.org/I145487455","display_name":"Cairo University","ror":"https://ror.org/03q21mh05","country_code":"EG","type":"education","lineage":["https://openalex.org/I145487455"]}],"countries":["EG"],"is_corresponding":true,"raw_author_name":"Lydia Wahid Rizkallah","raw_affiliation_strings":["Computer Engineering Department, Faculty of Engineering, Cairo University, Giza, Egypt"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Engineering Department, Faculty of Engineering, Cairo University, Giza, Egypt","institution_ids":["https://openalex.org/I145487455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5070534741"],"corresponding_institution_ids":["https://openalex.org/I145487455"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":87.9961,"has_fulltext":true,"cited_by_count":42,"citation_normalized_percentile":{"value":0.99943177,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"12","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gradient-boosting","display_name":"Gradient boosting","score":0.853749692440033},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.8330245018005371},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7449822425842285},{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.730637788772583},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.579632580280304},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5236831903457642},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4936009645462036},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3215276002883911},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.231878399848938},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1639193296432495},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16136369109153748}],"concepts":[{"id":"https://openalex.org/C70153297","wikidata":"https://www.wikidata.org/wiki/Q5591907","display_name":"Gradient boosting","level":3,"score":0.853749692440033},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.8330245018005371},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7449822425842285},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.730637788772583},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.579632580280304},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5236831903457642},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4936009645462036},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3215276002883911},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.231878399848938},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1639193296432495},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16136369109153748}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-025-01071-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01071-3","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-025-01071-3","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:c60d80722b504fbeb1c86e8572647979","is_oa":true,"landing_page_url":"https://doaj.org/article/c60d80722b504fbeb1c86e8572647979","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 12, Iss 1, Pp 1-34 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-025-01071-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01071-3","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-025-01071-3","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321148","display_name":"Cairo University","ror":"https://ror.org/03q21mh05"},{"id":"https://openalex.org/F4320321655","display_name":"Science and Technology Development Fund","ror":"https://ror.org/044vr6g03"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4407619039.pdf","grobid_xml":"https://content.openalex.org/works/W4407619039.grobid-xml"},"referenced_works_count":14,"referenced_works":["https://openalex.org/W2730943916","https://openalex.org/W2982127094","https://openalex.org/W2987201163","https://openalex.org/W2989902081","https://openalex.org/W3038447340","https://openalex.org/W3081125651","https://openalex.org/W3092092489","https://openalex.org/W3095017951","https://openalex.org/W3103103062","https://openalex.org/W3138941680","https://openalex.org/W4206256881","https://openalex.org/W4306650020","https://openalex.org/W4313481885","https://openalex.org/W4391023762"],"related_works":["https://openalex.org/W2967733078","https://openalex.org/W3204430031","https://openalex.org/W3137904399","https://openalex.org/W4310492845","https://openalex.org/W2885778889","https://openalex.org/W4310224730","https://openalex.org/W2766514146","https://openalex.org/W4289703016","https://openalex.org/W2885516856","https://openalex.org/W3094138326"],"abstract_inverted_index":{"Abstract":[0],"Gradient":[1],"Boosting":[2],"Trees":[3],"(GBT)":[4],"is":[5,12,45,64,89],"a":[6,61],"powerful":[7],"machine":[8],"learning":[9,16],"technique":[10],"that":[11,18,66,122],"based":[13],"on":[14,83,91],"ensemble":[15],"methods":[17],"leverage":[19],"the":[20,50,77,81,123],"idea":[21],"of":[22,49,80],"boosting.":[23],"GBT":[24,68,109,134],"combines":[25,67],"multiple":[26],"weak":[27],"learners":[28],"sequentially":[29],"to":[30,54,75],"boost":[31],"its":[32,36],"prediction":[33,56],"power":[34,79],"proving":[35],"outstanding":[37],"efficiency":[38,104],"in":[39],"many":[40],"problems,":[41],"and":[42,71,97,100,117],"hence":[43],"it":[44,101],"now":[46],"considered":[47],"one":[48,108,133],"top":[51],"techniques":[52],"used":[53],"solve":[55],"problems.":[57],"In":[58],"this":[59],"paper,":[60],"hybrid":[62],"approach":[63,82,88,125],"proposed":[65,87,124],"with":[69],"K-means":[70,73],"Bisecting":[72],"clustering":[74],"enhance":[76],"predictive":[78],"regression":[84,93],"datasets.":[85],"The":[86],"applied":[90],"40":[92],"datasets":[94],"from":[95],"UCI":[96],"Kaggle":[98],"websites":[99],"achieves":[102,126],"better":[103,128],"than":[105,130],"using":[106,131],"only":[107,132],"model.":[110,135],"Statistical":[111],"tests":[112,120],"are":[113],"applied,":[114],"namely,":[115],"Friedman":[116],"Wilcoxon":[118],"signed-rank":[119],"showing":[121],"significant":[127],"results":[129]},"counts_by_year":[{"year":2026,"cited_by_count":14},{"year":2025,"cited_by_count":28}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
