{"id":"https://openalex.org/W2124797841","doi":"https://doi.org/10.1109/msr.2009.5069480","title":"Tracking concept drift of software projects using defect prediction quality","display_name":"Tracking concept drift of software projects using defect prediction quality","publication_year":2009,"publication_date":"2009-05-01","ids":{"openalex":"https://openalex.org/W2124797841","doi":"https://doi.org/10.1109/msr.2009.5069480","mag":"2124797841"},"language":"en","primary_location":{"id":"doi:10.1109/msr.2009.5069480","is_oa":false,"landing_page_url":"https://doi.org/10.1109/msr.2009.5069480","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 6th IEEE International Working Conference on Mining Software Repositories","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047321863","display_name":"Jayalath Ekanayake","orcid":null},"institutions":[{"id":"https://openalex.org/I202697423","display_name":"University of Zurich","ror":"https://ror.org/02crff812","country_code":"CH","type":"education","lineage":["https://openalex.org/I202697423"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Jayalath Ekanayake","raw_affiliation_strings":["Dynamic and Distributed Systems Group, University of Zurich, Switzerland","Dynamic and Distributed Systems Group, Department of Informatics, University of Zurich, Switzerland#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dynamic and Distributed Systems Group, University of Zurich, Switzerland","institution_ids":["https://openalex.org/I202697423"]},{"raw_affiliation_string":"Dynamic and Distributed Systems Group, Department of Informatics, University of Zurich, Switzerland#TAB#","institution_ids":["https://openalex.org/I202697423"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011196488","display_name":"Jonas Tappolet","orcid":null},"institutions":[{"id":"https://openalex.org/I202697423","display_name":"University of Zurich","ror":"https://ror.org/02crff812","country_code":"CH","type":"education","lineage":["https://openalex.org/I202697423"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Jonas Tappolet","raw_affiliation_strings":["Dynamic and Distributed Systems Group, University of Zurich, Switzerland","Dynamic and Distributed Systems Group, Department of Informatics, University of Zurich, Switzerland#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dynamic and Distributed Systems Group, University of Zurich, Switzerland","institution_ids":["https://openalex.org/I202697423"]},{"raw_affiliation_string":"Dynamic and Distributed Systems Group, Department of Informatics, University of Zurich, Switzerland#TAB#","institution_ids":["https://openalex.org/I202697423"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009436227","display_name":"Harald C. Gall","orcid":"https://orcid.org/0000-0002-3874-5628"},"institutions":[{"id":"https://openalex.org/I202697423","display_name":"University of Zurich","ror":"https://ror.org/02crff812","country_code":"CH","type":"education","lineage":["https://openalex.org/I202697423"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Harald C. Gall","raw_affiliation_strings":["Software Evolution and Architecture Laboratory, University of Zurich, Switzerland","Software Evolution and Architecture Lab, Department of Informatics, University of Zurich, Switzerland#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Software Evolution and Architecture Laboratory, University of Zurich, Switzerland","institution_ids":["https://openalex.org/I202697423"]},{"raw_affiliation_string":"Software Evolution and Architecture Lab, Department of Informatics, University of Zurich, Switzerland#TAB#","institution_ids":["https://openalex.org/I202697423"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073592405","display_name":"Abraham Bernstein","orcid":"https://orcid.org/0000-0002-0128-4602"},"institutions":[{"id":"https://openalex.org/I202697423","display_name":"University of Zurich","ror":"https://ror.org/02crff812","country_code":"CH","type":"education","lineage":["https://openalex.org/I202697423"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Abraham Bernstein","raw_affiliation_strings":["Dynamic and Distributed Systems Group, University of Zurich, Switzerland","Dynamic and Distributed Systems Group, Department of Informatics, University of Zurich, Switzerland#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dynamic and Distributed Systems Group, University of Zurich, Switzerland","institution_ids":["https://openalex.org/I202697423"]},{"raw_affiliation_string":"Dynamic and Distributed Systems Group, Department of Informatics, University of Zurich, Switzerland#TAB#","institution_ids":["https://openalex.org/I202697423"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":12.4229,"has_fulltext":false,"cited_by_count":75,"citation_normalized_percentile":{"value":0.9841514,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7541158199310303},{"id":"https://openalex.org/keywords/eclipse","display_name":"Eclipse","score":0.6392683982849121},{"id":"https://openalex.org/keywords/software-bug","display_name":"Software bug","score":0.6221062541007996},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6077741384506226},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5581226348876953},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5513965487480164},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5212193727493286},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.5178273320198059},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5091072916984558},{"id":"https://openalex.org/keywords/software-quality","display_name":"Software quality","score":0.5070784091949463},{"id":"https://openalex.org/keywords/concept-drift","display_name":"Concept drift","score":0.48645731806755066},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.48063793778419495},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.44948112964630127},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.4442150890827179},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37467920780181885},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35532957315444946},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.3544332981109619},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14033502340316772},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.11853337287902832},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10790643095970154}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7541158199310303},{"id":"https://openalex.org/C2778505590","wikidata":"https://www.wikidata.org/wiki/Q141022","display_name":"Eclipse","level":2,"score":0.6392683982849121},{"id":"https://openalex.org/C1009929","wikidata":"https://www.wikidata.org/wiki/Q179550","display_name":"Software bug","level":3,"score":0.6221062541007996},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6077741384506226},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5581226348876953},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5513965487480164},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5212193727493286},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.5178273320198059},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5091072916984558},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.5070784091949463},{"id":"https://openalex.org/C60777511","wikidata":"https://www.wikidata.org/wiki/Q3045002","display_name":"Concept drift","level":3,"score":0.48645731806755066},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.48063793778419495},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.44948112964630127},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.4442150890827179},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37467920780181885},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35532957315444946},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.3544332981109619},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14033502340316772},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.11853337287902832},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10790643095970154},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/msr.2009.5069480","is_oa":false,"landing_page_url":"https://doi.org/10.1109/msr.2009.5069480","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 6th IEEE International Working Conference on Mining Software Repositories","raw_type":"proceedings-article"},{"id":"pmh:oai:www.zora.uzh.ch:25862","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401281","display_name":"Zurich Open Repository and Archive (University of Zurich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I202697423","host_organization_name":"University of Zurich","host_organization_lineage":["https://openalex.org/I202697423"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"Ekanayake, J; Tappolet, J; Gall, H C; Bernstein, A  (2009). Tracking concept drift of software projects using defect prediction quality.  In: 6th IEEE Working Conference on Mining Software Repositories, Vancouver, Canada, May 2009.","raw_type":"Conference or Workshop Item"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.462.3944","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.462.3944","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://ifipwg213.org/system/files/51MSR2009_0111_Ekanayake_Jayalath.pdf","raw_type":"text"},{"id":"doi:10.5167/uzh-25862","is_oa":true,"landing_page_url":"https://doi.org/10.5167/uzh-25862","pdf_url":null,"source":{"id":"https://openalex.org/S7407051291","display_name":"Universit\u00e4t Z\u00fcrich, ZORA","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":""}],"best_oa_location":{"id":"pmh:oai:www.zora.uzh.ch:25862","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401281","display_name":"Zurich Open Repository and Archive (University of Zurich)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I202697423","host_organization_name":"University of Zurich","host_organization_lineage":["https://openalex.org/I202697423"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"Ekanayake, J; Tappolet, J; Gall, H C; Bernstein, A  (2009). Tracking concept drift of software projects using defect prediction quality.  In: 6th IEEE Working Conference on Mining Software Repositories, Vancouver, Canada, May 2009.","raw_type":"Conference or Workshop Item"},"sustainable_development_goals":[{"score":0.550000011920929,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W139044672","https://openalex.org/W1570448133","https://openalex.org/W1599232982","https://openalex.org/W1973540172","https://openalex.org/W2036296745","https://openalex.org/W2082314767","https://openalex.org/W2096942889","https://openalex.org/W2113658292","https://openalex.org/W2125055259","https://openalex.org/W2142481192","https://openalex.org/W2147105902","https://openalex.org/W2150786161","https://openalex.org/W2151553346","https://openalex.org/W2156237258","https://openalex.org/W2159610968","https://openalex.org/W2164519300","https://openalex.org/W2966207845","https://openalex.org/W2983995785","https://openalex.org/W3145932680","https://openalex.org/W4252675558","https://openalex.org/W6605683200","https://openalex.org/W6635911578"],"related_works":["https://openalex.org/W2990081132","https://openalex.org/W4296984035","https://openalex.org/W3127121676","https://openalex.org/W3108206468","https://openalex.org/W137217271","https://openalex.org/W91167106","https://openalex.org/W3091433184","https://openalex.org/W3158675493","https://openalex.org/W3216967183","https://openalex.org/W2022585969"],"abstract_inverted_index":{"Defect":[0],"prediction":[1,33,64,127,132,163,176,236,246],"is":[2,35],"an":[3],"important":[4],"task":[5],"in":[6,82,158,200,210],"the":[7,13,29,32,40,44,53,62,83,89,131,135,159,174,208,218,234,255],"mining":[8],"of":[9,15,43,55,71,110,153,161,212,220,254,258],"software":[10,22,192],"repositories,":[11],"but":[12],"quality":[14,34,133,177],"predictions":[16],"varies":[17],"strongly":[18],"within":[19],"and":[20,100,102,105,116,129,146,155,183,217,231],"across":[21],"projects.":[23],"In":[24],"this":[25,122],"paper":[26],"we":[27,51,166,205],"investigate":[28],"reasons":[30],"why":[31],"so":[36],"fluctuating":[37],"due":[38,78,262],"to":[39,79,124,142,196,226,263],"altering":[41],"nature":[42],"bug":[45,85],"(or":[46],"defect)":[47],"fixing":[48],"process.":[49],"Therefore,":[50],"adopt":[52],"notion":[54],"a":[56,80,149,180,184,215,227,264],"concept":[57,144,198,229,266],"drift,":[58],"which":[59,171],"denotes":[60],"that":[61,191,207,241],"defect":[63,126,162,175,235,245],"model":[65],"has":[66,74],"become":[67],"unsuitable":[68],"as":[69,148],"set":[70],"influencing":[72,173],"features":[73,107],"changed":[75],"-":[76,147,151],"usually":[77],"change":[81,209],"underlying":[84],"generation":[86],"process":[87],"(i.e.,":[88],"concept).":[90],"We":[91,119],"explore":[92],"four":[93],"open":[94],"source":[95],"projects":[96],"(Eclipse,":[97],"OpenOffice,":[98],"Netbeans":[99],"Mozilla)":[101],"construct":[103],"file-level":[104],"project-level":[106],"for":[108,248],"each":[109],"them":[111,224],"from":[112],"their":[113,201],"respective":[114],"CVS":[115],"Bugzilla":[117],"repositories.":[118],"then":[120],"use":[121],"data":[123],"build":[125],"models":[128,247],"visualize":[130],"along":[134],"time":[136],"axis.":[137],"These":[138],"visualizations":[139],"allow":[140],"us":[141],"identify":[143,167],"drifts":[145,199],"consequence":[150],"phases":[152],"stability":[154,259],"instability":[156,261],"expressed":[157],"level":[160],"quality.":[164,237],"Further,":[165],"those":[168],"project":[169,242],"features,":[170],"are":[172,194],"using":[178,244],"both":[179],"tree":[181],"induction-algorithm":[182],"linear":[185],"regression":[186],"model.":[187],"Our":[188,238],"experiments":[189],"uncover":[190],"systems":[193],"subject":[195],"considerable":[197],"evolution":[202],"history.":[203],"Specifically,":[204],"observe":[206],"number":[211,219],"authors":[213],"editing":[214],"file":[216],"defects":[221],"fixed":[222],"by":[223],"contribute":[225],"project's":[228],"drift":[230],"therefore":[232],"influence":[233],"findings":[239],"suggest":[240],"managers":[243],"decision":[249],"making":[250],"should":[251],"be":[252],"aware":[253],"actual":[256],"phase":[257],"or":[260],"potential":[265],"drift.":[267]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":7},{"year":2012,"cited_by_count":7}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
