{"id":"https://openalex.org/W2601165891","doi":"https://doi.org/10.1109/maltesque.2017.7882013","title":"Automatic feature selection by regularization to improve bug prediction accuracy","display_name":"Automatic feature selection by regularization to improve bug prediction accuracy","publication_year":2017,"publication_date":"2017-02-21","ids":{"openalex":"https://openalex.org/W2601165891","doi":"https://doi.org/10.1109/maltesque.2017.7882013","mag":"2601165891"},"language":"en","primary_location":{"id":"doi:10.1109/maltesque.2017.7882013","is_oa":false,"landing_page_url":"https://doi.org/10.1109/maltesque.2017.7882013","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Workshop on Machine Learning Techniques for Software Quality Evaluation (MaLTeSQuE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030648899","display_name":"Haidar Osman","orcid":null},"institutions":[{"id":"https://openalex.org/I118564535","display_name":"University of Bern","ror":"https://ror.org/02k7v4d05","country_code":"CH","type":"education","lineage":["https://openalex.org/I118564535"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Haidar Osman","raw_affiliation_strings":["Software Composition Group, University of Bern, Bern, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Software Composition Group, University of Bern, Bern, Switzerland","institution_ids":["https://openalex.org/I118564535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024783227","display_name":"Mohammad Ghafari","orcid":"https://orcid.org/0000-0002-1986-9668"},"institutions":[{"id":"https://openalex.org/I118564535","display_name":"University of Bern","ror":"https://ror.org/02k7v4d05","country_code":"CH","type":"education","lineage":["https://openalex.org/I118564535"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Mohammad Ghafari","raw_affiliation_strings":["Software Composition Group, University of Bern, Bern, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Software Composition Group, University of Bern, Bern, Switzerland","institution_ids":["https://openalex.org/I118564535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5041096019","display_name":"Oscar Nierstrasz","orcid":"https://orcid.org/0000-0002-9975-9791"},"institutions":[{"id":"https://openalex.org/I118564535","display_name":"University of Bern","ror":"https://ror.org/02k7v4d05","country_code":"CH","type":"education","lineage":["https://openalex.org/I118564535"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Oscar Nierstrasz","raw_affiliation_strings":["Software Composition Group, University of Bern, Bern, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Software Composition Group, University of Bern, Bern, Switzerland","institution_ids":["https://openalex.org/I118564535"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5030648899"],"corresponding_institution_ids":["https://openalex.org/I118564535"],"apc_list":null,"apc_paid":null,"fwci":5.5685,"has_fulltext":false,"cited_by_count":37,"citation_normalized_percentile":{"value":0.9607542,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"27","last_page":"32"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.7992113828659058},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7564636468887329},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6711456775665283},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.6276334524154663},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6192437410354614},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.47400128841400146},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.470415860414505},{"id":"https://openalex.org/keywords/model-selection","display_name":"Model selection","score":0.4498139023780823},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4390876889228821},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.4281054735183716},{"id":"https://openalex.org/keywords/lasso","display_name":"Lasso (programming language)","score":0.42384690046310425},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1049065887928009},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10087040066719055}],"concepts":[{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.7992113828659058},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7564636468887329},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6711456775665283},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.6276334524154663},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6192437410354614},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.47400128841400146},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.470415860414505},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.4498139023780823},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4390876889228821},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.4281054735183716},{"id":"https://openalex.org/C37616216","wikidata":"https://www.wikidata.org/wiki/Q3218363","display_name":"Lasso (programming language)","level":2,"score":0.42384690046310425},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1049065887928009},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10087040066719055},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/maltesque.2017.7882013","is_oa":false,"landing_page_url":"https://doi.org/10.1109/maltesque.2017.7882013","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Workshop on Machine Learning Techniques for Software Quality Evaluation (MaLTeSQuE)","raw_type":"proceedings-article"},{"id":"pmh:oai:boris.unibe.ch:113142","is_oa":false,"landing_page_url":"https://boris.unibe.ch/113142/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401086","display_name":"Bern Open Repository and Information System (University of Bern)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I118564535","host_organization_name":"University of Bern","host_organization_lineage":["https://openalex.org/I118564535"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Osman, Haidar; Ghafari, Mohammad; Nierstrasz, Oscar Marius (21 February 2017). Automatic Feature Selection by Regularization to Improve Bug Prediction Accuracy. In: 1st international Workshop on Machine Learning Techniques for Software Quality Evaluation. Klagenfurt, Austria. 21. Feb. 2017. 10.1109/MALTESQUE.2017.7882013 &lt;http://dx.doi.org/10.1109/MALTESQUE.2017.7882013&gt;","raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1542582976","https://openalex.org/W1554944419","https://openalex.org/W1964062576","https://openalex.org/W1975040830","https://openalex.org/W1976850132","https://openalex.org/W1978937721","https://openalex.org/W1980851144","https://openalex.org/W1988510359","https://openalex.org/W1999785511","https://openalex.org/W2000251235","https://openalex.org/W2001599472","https://openalex.org/W2012319196","https://openalex.org/W2024594469","https://openalex.org/W2026750231","https://openalex.org/W2029578494","https://openalex.org/W2034445489","https://openalex.org/W2044280950","https://openalex.org/W2046830558","https://openalex.org/W2050496630","https://openalex.org/W2057179820","https://openalex.org/W2057780988","https://openalex.org/W2061019658","https://openalex.org/W2080521990","https://openalex.org/W2093831363","https://openalex.org/W2105300539","https://openalex.org/W2109386713","https://openalex.org/W2119016061","https://openalex.org/W2123934793","https://openalex.org/W2127623179","https://openalex.org/W2132887549","https://openalex.org/W2135198476","https://openalex.org/W2142481192","https://openalex.org/W2144746916","https://openalex.org/W2145026116","https://openalex.org/W2146474553","https://openalex.org/W2153863197","https://openalex.org/W2158744032","https://openalex.org/W2158864412","https://openalex.org/W2159610968","https://openalex.org/W2163732854","https://openalex.org/W2170866915","https://openalex.org/W2497047467","https://openalex.org/W3141989311","https://openalex.org/W3215186461","https://openalex.org/W6632525909"],"related_works":["https://openalex.org/W2380784125","https://openalex.org/W2810025138","https://openalex.org/W1997711767","https://openalex.org/W3118634075","https://openalex.org/W4386543887","https://openalex.org/W4387885766","https://openalex.org/W2765894738","https://openalex.org/W3015383640","https://openalex.org/W2083862258","https://openalex.org/W3144599579"],"abstract_inverted_index":{"Bug":[0],"prediction":[1,48,67,86,107,124,163],"has":[2],"been":[3,27],"a":[4,21,32,47,65,85],"hot":[5],"research":[6],"topic":[7],"for":[8,147],"the":[9,42,61,97,129,157,162,166],"past":[10],"two":[11],"decades,":[12],"during":[13],"which":[14],"different":[15],"machine":[16,76],"learning":[17,77],"models":[18],"based":[19],"on":[20,105,139],"variety":[22],"of":[23,46,63,96,102,131,165],"software":[24],"metrics":[25],"have":[26],"proposed.":[28],"Feature":[29],"selection":[30,52,81,92,120],"is":[31,53,108],"technique":[33],"that":[34,83,156],"removes":[35],"noisy":[36],"and":[37,44,69,137,141,168],"redundant":[38],"features":[39],"to":[40,60,88],"improve":[41,169],"accuracy":[43],"generalizability":[45],"model.":[49],"Although":[50],"feature":[51,80,91,119],"important,":[54],"it":[55],"adds":[56],"yet":[57],"another":[58],"step":[59],"process":[62],"building":[64],"bug":[66,106,123,145],"model":[68,87],"increases":[70],"its":[71],"complexity.":[72],"Recent":[73],"advances":[74],"in":[75,122],"introduce":[78],"embedded":[79,118],"methods":[82,104,134,160],"allow":[84],"carry":[89],"out":[90],"automatically":[93],"as":[94,116,144],"part":[95],"training":[98],"process.":[99],"The":[100],"effect":[101],"these":[103],"unknown.":[109],"In":[110],"this":[111],"paper":[112],"we":[113,127],"study":[114,128],"regularization":[115,133,159],"an":[117],"method":[121],"models.":[125],"Specifically,":[126],"impact":[130],"three":[132,158],"(Ridge,":[135],"Lasso,":[136],"ElasticNet)":[138],"linear":[140],"Poisson":[142],"Regression":[143],"predictors":[146],"five":[148],"open":[149],"source":[150],"Java":[151],"systems.":[152],"Our":[153],"results":[154],"show":[155],"reduce":[161],"error":[164],"regressors":[167],"their":[170],"stability.":[171]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":1}],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2025-10-10T00:00:00"}
