{"id":"https://openalex.org/W4226106048","doi":"https://doi.org/10.48550/arxiv.2203.00803","title":"Code Smells in Machine Learning Systems","display_name":"Code Smells in Machine Learning Systems","publication_year":2022,"publication_date":"2022-03-02","ids":{"openalex":"https://openalex.org/W4226106048","doi":"https://doi.org/10.48550/arxiv.2203.00803"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2203.00803","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2203.00803","pdf_url":"https://arxiv.org/pdf/2203.00803","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2203.00803","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006496692","display_name":"Jiri Gesi","orcid":"https://orcid.org/0000-0002-1188-2921"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gesi, Jiri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100390245","display_name":"Siqi Liu","orcid":"https://orcid.org/0000-0003-1751-4385"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Siqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108050276","display_name":"Jiawei Li","orcid":"https://orcid.org/0000-0001-9801-4715"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jiawei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078115464","display_name":"Iftekhar Ahmed","orcid":"https://orcid.org/0000-0001-8221-5352"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmed, Iftekhar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101612061","display_name":"Nachiappan Nagappan","orcid":"https://orcid.org/0000-0003-1358-4124"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nagappan, Nachiappan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081036622","display_name":"David Lo","orcid":"https://orcid.org/0000-0002-4367-7201"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lo, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055793778","display_name":"Eduardo Santana de Almeida","orcid":"https://orcid.org/0000-0002-9312-6715"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Almeida, Eduardo Santana","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033873409","display_name":"Pavneet Singh Kochhar","orcid":"https://orcid.org/0000-0002-4342-6672"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kochhar, Pavneet Singh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5007075465","display_name":"Lingfeng Bao","orcid":"https://orcid.org/0000-0003-1846-0921"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bao, Lingfeng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5006496692"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9697999954223633,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9430999755859375,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code-smell","display_name":"Code smell","score":0.8896550536155701},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6516698598861694},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.639228343963623},{"id":"https://openalex.org/keywords/code-review","display_name":"Code review","score":0.5813344120979309},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5659081935882568},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.46613284945487976},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.43096923828125},{"id":"https://openalex.org/keywords/software-system","display_name":"Software system","score":0.42649608850479126},{"id":"https://openalex.org/keywords/software-maintenance","display_name":"Software maintenance","score":0.4109841287136078},{"id":"https://openalex.org/keywords/software-quality","display_name":"Software quality","score":0.37223196029663086},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33830660581588745},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.33261919021606445},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.2952198088169098},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.19318902492523193}],"concepts":[{"id":"https://openalex.org/C133237599","wikidata":"https://www.wikidata.org/wiki/Q2295111","display_name":"Code smell","level":5,"score":0.8896550536155701},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6516698598861694},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.639228343963623},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.5813344120979309},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5659081935882568},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.46613284945487976},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.43096923828125},{"id":"https://openalex.org/C149091818","wikidata":"https://www.wikidata.org/wiki/Q2429814","display_name":"Software system","level":3,"score":0.42649608850479126},{"id":"https://openalex.org/C101317890","wikidata":"https://www.wikidata.org/wiki/Q940053","display_name":"Software maintenance","level":4,"score":0.4109841287136078},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.37223196029663086},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33830660581588745},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.33261919021606445},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.2952198088169098},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.19318902492523193},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2203.00803","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2203.00803","pdf_url":"https://arxiv.org/pdf/2203.00803","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2203.00803","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2203.00803","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2203.00803","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2203.00803","pdf_url":"https://arxiv.org/pdf/2203.00803","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3175279244","https://openalex.org/W3137757622","https://openalex.org/W2083714857","https://openalex.org/W3121200789","https://openalex.org/W1847720358","https://openalex.org/W2899956841","https://openalex.org/W4280612920","https://openalex.org/W2518360245","https://openalex.org/W3116427025","https://openalex.org/W4307656098"],"abstract_inverted_index":{"As":[0],"Deep":[1],"learning":[2],"(DL)":[3],"systems":[4,23,40,215],"continuously":[5],"evolve":[6],"and":[7,29,76,105,119,155,181,195,208],"grow,":[8],"assuring":[9],"their":[10,78],"quality":[11],"becomes":[12],"an":[13],"important":[14],"yet":[15],"challenging":[16],"task.":[17],"Compared":[18],"to":[19,41,45,52,107],"non-DL":[20,64],"systems,":[21,101,154],"DL":[22,39,99,146,153,165,174,214],"have":[24,124,142],"more":[25,43],"complex":[26],"team":[27],"compositions":[28],"heavier":[30],"data":[31],"dependency.":[32],"These":[33],"inherent":[34],"characteristics":[35],"would":[36],"potentially":[37],"cause":[38],"be":[42],"vulnerable":[44],"bugs":[46],"and,":[47],"in":[48,82,95,164,173],"the":[49,88,96,138,150,179,182,211,217],"long":[50],"run,":[51],"maintenance":[53,81,116,139,212],"issues.":[54],"Code":[55],"smells":[56,94,122,172,189,205],"are":[57,206],"empirically":[58],"tested":[59],"as":[60],"efficient":[61],"indicators":[62],"of":[63,98,115,152,184,193,213],"systems.":[65,166,175],"Therefore,":[66],"we":[67,135,156,168,177],"took":[68],"a":[69,109,191],"step":[70],"forward":[71],"into":[72],"identifying":[73],"code":[74,93,121,171,188,204],"smells,":[75],"understanding":[77],"impact":[79,183],"on":[80,91,210],"this":[83],"comprehensive":[84],"study.":[85],"This":[86],"is":[87],"first":[89,110],"study":[90],"investigating":[92],"context":[97],"software":[100],"which":[102],"helps":[103],"researchers":[104],"practitioners":[106],"get":[108],"look":[111],"at":[112],"what":[113,120],"kind":[114],"modification":[117,162],"made":[118,144],"developers":[123,147],"been":[125,143],"dealing":[126],"with.":[127],"Our":[128],"paper":[129],"has":[130],"three":[131],"major":[132],"contributions.":[133],"First,":[134],"comprehensively":[136],"investigated":[137],"modifications":[140],"that":[141,200],"by":[145],"via":[148],"studying":[149],"evolution":[151],"identified":[157,187,203],"nine":[158],"frequently":[159],"occurred":[160],"maintenance-related":[161],"categories":[163],"Second,":[167],"summarized":[169],"five":[170],"Third,":[176],"validated":[178],"prevalence,":[180],"our":[185,201],"newly":[186,202],"through":[190],"mixture":[192],"qualitative":[194],"quantitative":[196],"analysis.":[197],"We":[198],"found":[199],"prevalent":[207],"impactful":[209],"from":[216],"developer's":[218],"perspective.":[219]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
