{"id":"https://openalex.org/W4414459468","doi":"https://doi.org/10.1007/s00521-025-11648-x","title":"CorrBoost: a feature selection technique and utility of tabular deep neural networks in software fault prediction","display_name":"CorrBoost: a feature selection technique and utility of tabular deep neural networks in software fault prediction","publication_year":2025,"publication_date":"2025-09-24","ids":{"openalex":"https://openalex.org/W4414459468","doi":"https://doi.org/10.1007/s00521-025-11648-x"},"language":"en","primary_location":{"id":"doi:10.1007/s00521-025-11648-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11648-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11648-x.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11648-x.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051884352","display_name":"Tamanna Sharma","orcid":null},"institutions":[{"id":"https://openalex.org/I74653059","display_name":"Public Health Foundation of India","ror":"https://ror.org/058s20p71","country_code":"IN","type":"nonprofit","lineage":["https://openalex.org/I74653059"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Tamanna Sharma","raw_affiliation_strings":["Publicis Sapient, Gurgaon, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Publicis Sapient, Gurgaon, India","institution_ids":["https://openalex.org/I74653059"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064136287","display_name":"Sanjay Misra","orcid":"https://orcid.org/0000-0002-3556-9331"},"institutions":[{"id":"https://openalex.org/I3130438513","display_name":"Institute for Energy Technology","ror":"https://ror.org/02jqtg033","country_code":"NO","type":"facility","lineage":["https://openalex.org/I3130438513"]}],"countries":["NO"],"is_corresponding":true,"raw_author_name":"Sanjay Misra","raw_affiliation_strings":["Institute of Energy Technology (IFE), Halden, Norway"],"raw_orcid":"https://orcid.org/0000-0002-3556-9331","affiliations":[{"raw_affiliation_string":"Institute of Energy Technology (IFE), Halden, Norway","institution_ids":["https://openalex.org/I3130438513"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038626586","display_name":"Ricardo Colomo\u2010Palacios","orcid":"https://orcid.org/0000-0002-1555-9726"},"institutions":[{"id":"https://openalex.org/I88060688","display_name":"Universidad Polit\u00e9cnica de Madrid","ror":"https://ror.org/03n6nwv02","country_code":"ES","type":"education","lineage":["https://openalex.org/I88060688"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Ricardo Colomo-Palacios","raw_affiliation_strings":["Department of Computer Science, Universidad Politecnica de Madrid, Madrid, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Universidad Politecnica de Madrid, Madrid, Spain","institution_ids":["https://openalex.org/I88060688"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5064136287"],"corresponding_institution_ids":["https://openalex.org/I3130438513"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.35596006,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"37","issue":"32","first_page":"26845","last_page":"26886"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.7218999862670898},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5861999988555908},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5145999789237976},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4909999966621399},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4489000141620636},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.4487000107765198},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.3946000039577484},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.36959999799728394},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.3529999852180481}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8224999904632568},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7282999753952026},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.7218999862670898},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6510000228881836},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5861999988555908},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5145999789237976},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4909999966621399},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4489000141620636},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.4487000107765198},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.44510000944137573},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.3946000039577484},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.36959999799728394},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.3529999852180481},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3450999855995178},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.3393000066280365},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.32499998807907104},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.32109999656677246},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.3206000030040741},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.31029999256134033},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C1009929","wikidata":"https://www.wikidata.org/wiki/Q179550","display_name":"Software bug","level":3,"score":0.2978000044822693},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2667999863624573},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.2628999948501587},{"id":"https://openalex.org/C197323446","wikidata":"https://www.wikidata.org/wiki/Q331222","display_name":"Oversampling","level":3,"score":0.2619999945163727},{"id":"https://openalex.org/C175551986","wikidata":"https://www.wikidata.org/wiki/Q47089","display_name":"Fault (geology)","level":2,"score":0.2605000138282776},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00521-025-11648-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11648-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11648-x.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00521-025-11648-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11648-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11648-x.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4414459468.pdf","grobid_xml":"https://content.openalex.org/works/W4414459468.grobid-xml"},"referenced_works_count":84,"referenced_works":["https://openalex.org/W1490324987","https://openalex.org/W1611601820","https://openalex.org/W1678356000","https://openalex.org/W1964962870","https://openalex.org/W1969483024","https://openalex.org/W1970065340","https://openalex.org/W1970789984","https://openalex.org/W1987855178","https://openalex.org/W2007338412","https://openalex.org/W2025700486","https://openalex.org/W2030623877","https://openalex.org/W2060561050","https://openalex.org/W2069429561","https://openalex.org/W2089763487","https://openalex.org/W2092939357","https://openalex.org/W2101234009","https://openalex.org/W2104933073","https://openalex.org/W2118283821","https://openalex.org/W2130898128","https://openalex.org/W2136706100","https://openalex.org/W2143426320","https://openalex.org/W2143637886","https://openalex.org/W2146338950","https://openalex.org/W2150874999","https://openalex.org/W2153635508","https://openalex.org/W2157353183","https://openalex.org/W2158698691","https://openalex.org/W2158864412","https://openalex.org/W2163732854","https://openalex.org/W2164627280","https://openalex.org/W2253795368","https://openalex.org/W2290195878","https://openalex.org/W2293040502","https://openalex.org/W2295598076","https://openalex.org/W2303043072","https://openalex.org/W2471516951","https://openalex.org/W2474835145","https://openalex.org/W2567070169","https://openalex.org/W2606020393","https://openalex.org/W2613904329","https://openalex.org/W2743316948","https://openalex.org/W2772617084","https://openalex.org/W2783657687","https://openalex.org/W2795247881","https://openalex.org/W2796525775","https://openalex.org/W2809021616","https://openalex.org/W2845365777","https://openalex.org/W2890838230","https://openalex.org/W2905816416","https://openalex.org/W2911964244","https://openalex.org/W2919115771","https://openalex.org/W2921707507","https://openalex.org/W2959969964","https://openalex.org/W2962956369","https://openalex.org/W2963520355","https://openalex.org/W2983209690","https://openalex.org/W2985145524","https://openalex.org/W2993673073","https://openalex.org/W2994099454","https://openalex.org/W3006436762","https://openalex.org/W3035711813","https://openalex.org/W3036075185","https://openalex.org/W3098350627","https://openalex.org/W3172831760","https://openalex.org/W3215497572","https://openalex.org/W4212883601","https://openalex.org/W4224242396","https://openalex.org/W4229042779","https://openalex.org/W4232632925","https://openalex.org/W4238530616","https://openalex.org/W4239605813","https://openalex.org/W4252871143","https://openalex.org/W4286910448","https://openalex.org/W4287115869","https://openalex.org/W4287124503","https://openalex.org/W4290728118","https://openalex.org/W4293713156","https://openalex.org/W4294541781","https://openalex.org/W4294982321","https://openalex.org/W4295312788","https://openalex.org/W4300900294","https://openalex.org/W4301186107","https://openalex.org/W4307908377","https://openalex.org/W4384026509"],"related_works":[],"abstract_inverted_index":{"Abstract":[0],"Context":[1],"Software":[2],"Fault":[3],"Prediction":[4],"(SFP)":[5],"leverages":[6],"supervised":[7],"Machine":[8],"Learning":[9,26],"to":[10,33,53,92],"detect":[11],"faulty":[12],"software":[13,16],"constructs":[14],"using":[15,112,121],"metrics":[17],"and":[18,51,70,82,104,110,115,127,133,144,168,188],"corresponding":[19],"labels.":[20],"Despite":[21],"recent":[22],"advances":[23],"in":[24,140,153],"Deep":[25],"(DL)":[27],"for":[28,72,202],"tabular":[29,61,191],"data,":[30],"their":[31],"application":[32],"SFP":[34,203],"remains":[35],"underexplored.":[36],"Objectives":[37],"This":[38],"study":[39],"proposes":[40],"a":[41,149,183],"novel":[42],"feature":[43,55,154],"selection":[44],"method,":[45],"CorrBoost,":[46],"which":[47],"combines":[48],"correlation":[49],"analysis":[50],"XGBoost":[52],"address":[54],"dimensionality.":[56],"Additionally,":[57],"we":[58,85],"evaluate":[59],"existing":[60,134],"DL":[62,98,138,160,192],"architectures,":[63],"super":[64],"convergent":[65],"deep":[66],"neural":[67],"networks":[68],"(sDNN)":[69],"TabNet":[71],"SFP.":[73],"Methods":[74],"Using":[75],"26":[76],"public":[77],"datasets":[78],"from":[79],"NASA,":[80],"PROMISE,":[81],"AEEEM":[83],"repositories,":[84],"apply":[86],"the":[87,122],"adaptive":[88],"synthetic":[89],"oversampling":[90],"technique":[91],"manage":[93],"class":[94],"imbalance.":[95],"We":[96],"compare":[97],"models":[99,108,136,181],"with":[100,156,178],"five":[101],"state-of-the-art":[102,135],"techniques":[103],"two":[105],"gradient-boosted":[106],"tree":[107,180],"(XGBoost":[109],"LightGBM)":[111],"AUC-ROC,":[113],"AUPRC,":[114],"Accuracy.":[116],"Statistical":[117],"significance":[118],"is":[119],"validated":[120],"Bayesian":[123],"Signed":[124],"Rank":[125],"Test":[126],"Scott-Knott":[128],"ESD.":[129],"Results":[130],"Gradient-boosted":[131],"trees":[132],"outperform":[137],"methods":[139,201],"AUC-ROC":[141],"by":[142],"17.9%":[143],"9.6%,":[145],"respectively.":[146],"CorrBoost":[147,176],"achieves":[148],"55%":[150],"average":[151],"reduction":[152],"dimensionality":[155],"negligible":[157],"performance":[158,187],"loss.":[159],"methods,":[161],"however,":[162],"incur":[163],"significantly":[164],"higher":[165],"processing":[166],"time":[167],"perform":[169],"poorly":[170],"on":[171,204],"unseen":[172],"test":[173],"data.":[174,206],"Conclusion":[175],"combined":[177],"boosted":[179],"offers":[182],"superior":[184],"trade-off":[185],"between":[186],"computation.":[189],"While":[190],"architectures":[193],"hold":[194],"promise,":[195],"they":[196],"currently":[197],"lag":[198],"behind":[199],"traditional":[200],"real-world":[205]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
