{"id":"https://openalex.org/W3052585663","doi":"https://doi.org/10.1109/iske47853.2019.9170328","title":"A Hybrid Data Preprocessing Technique based on Maximum Likelihood Logistic Regression with Filtering for Enhancing Software Defect Prediction","display_name":"A Hybrid Data Preprocessing Technique based on Maximum Likelihood Logistic Regression with Filtering for Enhancing Software Defect Prediction","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W3052585663","doi":"https://doi.org/10.1109/iske47853.2019.9170328","mag":"3052585663"},"language":"en","primary_location":{"id":"doi:10.1109/iske47853.2019.9170328","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iske47853.2019.9170328","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 14th International Conference on Intelligent Systems and Knowledge Engineering (ISKE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024206271","display_name":"Kamal Bashir","orcid":"https://orcid.org/0000-0002-1820-6010"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Kamal Bashir","raw_affiliation_strings":["Southwest Jiaotong University,School of Information Science and Technology,Chengdu,China,611756","School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Information Science and Technology,Chengdu,China,611756","institution_ids":["https://openalex.org/I4800084"]},{"raw_affiliation_string":"School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064794037","display_name":"Tayseer Ali","orcid":null},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tayseer Ali","raw_affiliation_strings":["Southwest Jiaotong University,School of Material Science and Engineering,Chengdu,China,611756","School of Material Science and Engineering, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Material Science and Engineering,Chengdu,China,611756","institution_ids":["https://openalex.org/I4800084"]},{"raw_affiliation_string":"School of Material Science and Engineering, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022128757","display_name":"Mahama Yahaya","orcid":null},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mahama Yahaya","raw_affiliation_strings":["Southwest Jiaotong University,School of Transport and Logistics Engineering,Chengdu,China,611756","School of Transport and Logistics Engineering, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Transport and Logistics Engineering,Chengdu,China,611756","institution_ids":["https://openalex.org/I4800084"]},{"raw_affiliation_string":"School of Transport and Logistics Engineering, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022715025","display_name":"Ahmed Saad Hussein","orcid":null},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ahmed Saad Hussein","raw_affiliation_strings":["Southwest Jiaotong University,School of Information Science and Technology,Chengdu,China,611756","School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Information Science and Technology,Chengdu,China,611756","institution_ids":["https://openalex.org/I4800084"]},{"raw_affiliation_string":"School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5024206271"],"corresponding_institution_ids":["https://openalex.org/I4800084"],"apc_list":null,"apc_paid":null,"fwci":0.6783,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.80805374,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"921","last_page":"927"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.979200005531311,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.8163713812828064},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6911566853523254},{"id":"https://openalex.org/keywords/data-pre-processing","display_name":"Data pre-processing","score":0.6049120426177979},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.5895218253135681},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5715963840484619},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5610562562942505},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.553915798664093},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5323180556297302},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5054736137390137},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.49840617179870605},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.4642195701599121},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.4268019199371338},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37247157096862793}],"concepts":[{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.8163713812828064},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6911566853523254},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.6049120426177979},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.5895218253135681},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5715963840484619},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5610562562942505},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.553915798664093},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5323180556297302},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5054736137390137},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.49840617179870605},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.4642195701599121},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.4268019199371338},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37247157096862793},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iske47853.2019.9170328","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iske47853.2019.9170328","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 14th International Conference on Intelligent Systems and Knowledge Engineering (ISKE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W168970045","https://openalex.org/W1995806857","https://openalex.org/W2095642553","https://openalex.org/W2101195239","https://openalex.org/W2146338950","https://openalex.org/W2151666086","https://openalex.org/W2160958420","https://openalex.org/W2164873210","https://openalex.org/W2239636899","https://openalex.org/W2784042651","https://openalex.org/W2785772932","https://openalex.org/W2922466793","https://openalex.org/W2991623083","https://openalex.org/W2998216295","https://openalex.org/W3141989311","https://openalex.org/W4255000972","https://openalex.org/W4285719527","https://openalex.org/W6674522558","https://openalex.org/W7066667914"],"related_works":["https://openalex.org/W4388745254","https://openalex.org/W2989490741","https://openalex.org/W2980082554","https://openalex.org/W1517228774","https://openalex.org/W2767419625","https://openalex.org/W2389704471","https://openalex.org/W3092506759","https://openalex.org/W2367545121","https://openalex.org/W4248881655","https://openalex.org/W2482165163"],"abstract_inverted_index":{"Software":[0,248],"Defect":[1,249],"Prediction":[2,250],"(SDP)":[3],"is":[4,99,115,125,153],"critical":[5],"to":[6,16,69,118,155,240],"ensure":[7],"product":[8],"reliability":[9],"and":[10,46,122,142,146,187,203,219,237,259],"customer":[11],"satisfaction.":[12],"Many":[13],"studies":[14],"conducted":[15,116],"predict":[17],"defective":[18,301],"modules":[19,302],"in":[20,110,164,234,290,303],"the":[21,52,74,91,123,158,165,177,181,267,273,285,292,304],"software":[22,27,168,231,305],"development":[23,306],"process":[24],"applied":[25,199,214],"historical":[26],"defect":[28,169,232],"data":[29,35,53,67,88,209,218],"mined":[30],"from":[31,37,207,222],"online":[32,38],"depositories.":[33],"However,":[34],"obtained":[36],"depositories":[39],"have":[40,171],"problems":[41,89],"associated":[42],"with":[43],"high":[44],"dimensionality":[45,49],"noisy.":[47],"High":[48],"comes":[50],"when":[51],"contains":[54],"a":[55,106,216],"huge":[56],"number":[57],"of":[58,64,76,86,94,160,167,184,247,272,300],"independent":[59],"attributes":[60],"for":[61,90,162,244,296],"developing":[62],"models":[63,274],"classification.":[65],"Noisy":[66],"refer":[68],"those":[70],"located":[71],"deep":[72],"inside":[73],"region":[75],"different":[77],"class":[78],"other":[79],"than":[80],"their":[81,235],"own.":[82],"The":[83,252,270,281],"adverse":[84],"effect":[85],"these":[87],"prediction":[92,170,299],"performance":[93,271],"most":[95],"statistical":[96],"learning":[97],"methodologies":[98],"self-evident.":[100],"To":[101],"this":[102,227],"end,":[103],"we":[104],"suggest":[105],"hybrid":[107],"preprocessing":[108],"approach":[109,213],"which":[111],"iterative":[112],"partitioning":[113],"filtering":[114,189],"prior":[117],"feature":[119,294],"selection":[120,186,197,212],"(FS)":[121],"technique":[124,198],"validated":[126],"using":[127,276],"selected":[128,206,221,268],"FS":[129,163],"methods":[130],"including":[131],"Chisquare":[132],"(CS),":[133],"information":[134],"gain":[135,137],"(IG),":[136],"ratio":[138],"(GR),":[139],"relief":[140],"(RF)":[141],"symmetric":[143],"uncertainty":[144],"(SU)":[145],"maximum":[147],"likelihood":[148],"logistic":[149],"regression":[150],"(MLLR).":[151],"It":[152],"important":[154],"note":[156],"that":[157,284],"idea":[159],"MLLR":[161,286],"context":[166],"not":[172],"been":[173],"fully":[174],"investigated":[175],"despite":[176],"potential":[178],"usefulness.":[179],"For":[180],"combined":[182],"use":[183],"variable":[185,196,211],"noise":[188],"(NF),":[190],"two":[191],"cases":[192],"are":[193,264,279],"considered:":[194],"(1)":[195],"on":[200,215,229,266],"original":[201,208],"dataset":[202],"relevant":[204],"variables":[205,220],"(2)":[210],"cleaned":[217,223],"data.":[224],"We":[225],"apply":[226],"method":[228],"six":[230],"datasets":[233],"clean":[236],"noisy":[238],"form":[239],"select":[241],"useful":[242,289],"features":[243],"classification":[245],"modeling":[246],"(SDP).":[251],"Random":[253],"Forest":[254],"(RaF),":[255],"K-Nearest":[256],"Neighbors":[257],"(KNN)":[258],"Multilayer":[260],"Perceptron":[261],"(MLP)":[262],"classifiers":[263],"tested":[265],"feature.":[269],"captured":[275],"three":[277],"indicators":[278],"compared.":[280],"results":[282],"confirm":[283],"can":[287],"be":[288],"selecting":[291],"optimal":[293],"subset":[295],"more":[297],"accurate":[298],"process.":[307]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
