{"id":"https://openalex.org/W6911689491","doi":"https://doi.org/10.5281/zenodo.13631459","title":"Detecting Code Smells using ChatGPT: Initial Insights","display_name":"Detecting Code Smells using ChatGPT: Initial Insights","publication_year":2024,"publication_date":"2024-06-06","ids":{"openalex":"https://openalex.org/W6911689491","doi":"https://doi.org/10.5281/zenodo.13631459"},"language":"en","primary_location":{"id":"doi:10.5281/zenodo.13631459","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13631459","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.13631459","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Silva, Luciana Lourdes","orcid":"https://orcid.org/0000-0002-9987-4538"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Silva, Luciana Lourdes","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Silva, Janio Rosa da","orcid":"https://orcid.org/0000-0001-8756-9344"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Silva, Janio Rosa da","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Montandon, Jo\u00e3o Eduardo","orcid":"https://orcid.org/0000-0002-3371-7353"},"institutions":[{"id":"https://openalex.org/I110200422","display_name":"Universidade Federal de Minas Gerais","ror":"https://ror.org/0176yjw32","country_code":"BR","type":"education","lineage":["https://openalex.org/I110200422"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Montandon, Jo\u00e3o Eduardo","raw_affiliation_strings":["Universidade Federal de Minas Gerais"],"affiliations":[{"raw_affiliation_string":"Universidade Federal de Minas Gerais","institution_ids":["https://openalex.org/I110200422"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Andrade, Marcus","orcid":"https://orcid.org/0009-0004-4429-9777"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andrade, Marcus","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Valente, Marco Tulio","orcid":"https://orcid.org/0000-0002-8180-7548"},"institutions":[{"id":"https://openalex.org/I110200422","display_name":"Universidade Federal de Minas Gerais","ror":"https://ror.org/0176yjw32","country_code":"BR","type":"education","lineage":["https://openalex.org/I110200422"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Valente, Marco Tulio","raw_affiliation_strings":["Universidade Federal de Minas Gerais"],"affiliations":[{"raw_affiliation_string":"Universidade Federal de Minas Gerais","institution_ids":["https://openalex.org/I110200422"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":null,"topics":[],"keywords":[{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.5756999850273132},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.5403000116348267},{"id":"https://openalex.org/keywords/directory","display_name":"Directory","score":0.5170999765396118},{"id":"https://openalex.org/keywords/replication","display_name":"Replication (statistics)","score":0.5062000155448914},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4997999966144562},{"id":"https://openalex.org/keywords/timestamp","display_name":"Timestamp","score":0.46700000762939453},{"id":"https://openalex.org/keywords/column","display_name":"Column (typography)","score":0.4668999910354614},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.4490000009536743},{"id":"https://openalex.org/keywords/file-format","display_name":"File format","score":0.4108999967575073}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8012999892234802},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.5756999850273132},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.5403000116348267},{"id":"https://openalex.org/C2777683733","wikidata":"https://www.wikidata.org/wiki/Q201456","display_name":"Directory","level":2,"score":0.5170999765396118},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5076000094413757},{"id":"https://openalex.org/C12590798","wikidata":"https://www.wikidata.org/wiki/Q3933199","display_name":"Replication (statistics)","level":2,"score":0.5062000155448914},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4997999966144562},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4869999885559082},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.46700000762939453},{"id":"https://openalex.org/C2780551164","wikidata":"https://www.wikidata.org/wiki/Q2306599","display_name":"Column (typography)","level":3,"score":0.4668999910354614},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.4490000009536743},{"id":"https://openalex.org/C97250363","wikidata":"https://www.wikidata.org/wiki/Q235557","display_name":"File format","level":2,"score":0.4108999967575073},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.38659998774528503},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3797999918460846},{"id":"https://openalex.org/C59276292","wikidata":"https://www.wikidata.org/wiki/Q580427","display_name":"Database index","level":3,"score":0.3785000145435333},{"id":"https://openalex.org/C133237599","wikidata":"https://www.wikidata.org/wiki/Q2295111","display_name":"Code smell","level":5,"score":0.3781999945640564},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.35690000653266907},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.35659998655319214},{"id":"https://openalex.org/C2777561058","wikidata":"https://www.wikidata.org/wiki/Q2652119","display_name":"Program comprehension","level":4,"score":0.3228999972343445},{"id":"https://openalex.org/C54239708","wikidata":"https://www.wikidata.org/wiki/Q1329910","display_name":"View","level":3,"score":0.30570000410079956},{"id":"https://openalex.org/C68476402","wikidata":"https://www.wikidata.org/wiki/Q1456936","display_name":"Table of contents","level":2,"score":0.2948000133037567},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.29260000586509705},{"id":"https://openalex.org/C201743585","wikidata":"https://www.wikidata.org/wiki/Q1373925","display_name":"Flat file database","level":5,"score":0.29120001196861267},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.27309998869895935},{"id":"https://openalex.org/C171730128","wikidata":"https://www.wikidata.org/wiki/Q5227290","display_name":"Data file","level":2,"score":0.2728999853134155},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C10272871","wikidata":"https://www.wikidata.org/wiki/Q929972","display_name":"Software inspection","level":5,"score":0.26809999346733093},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.26589998602867126},{"id":"https://openalex.org/C154420247","wikidata":"https://www.wikidata.org/wiki/Q846619","display_name":"Stored procedure","level":5,"score":0.2614000141620636},{"id":"https://openalex.org/C5968703","wikidata":"https://www.wikidata.org/wiki/Q267136","display_name":"Database model","level":3,"score":0.25270000100135803}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.13631459","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13631459","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.5281/zenodo.13631459","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13631459","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Replication":[0,9],"Package:":[1],"Detecting":[2,24],"Code":[3,25],"Smells":[4,26],"using":[5,27],"ChatGPT:":[6,28],"Initial":[7,29],"Insights":[8],"Package":[10],"This":[11,192],"repository":[12],"contains":[13,96,119,184,194,388],"data":[14,38,410],"files":[15],"to":[16,71,180,187,200,382,398,400,404,421],"replicate":[17],"our":[18,181,188],"study":[19],"presented":[20],"in":[21,39,46,57,68,90,216,222,254,272,282,302,319,329,366,456],"the":[22,44,55,66,73,76,80,87,177,196,205,210,223,232,248,255,273,280,283,287,296,303,310,320,327,330,343,350,354,359,367,378,393,418,422,425,428,439,443,448,451,457,460,464,468],"paper":[23],"Insights.":[30],"Dataset":[31,106],"Structure":[32],"We":[33,234],"provide":[34],"raw":[35],"and":[36,84,209,315,337,402],"preprocessed":[37],"different":[40],"formats:":[41],"csv":[42],"-":[43,54,65,79,171,183,191,218,227,240,276,290,306,323,339,349,363,370,416,424,434,438,447,454,463],"database":[45,56,67,88],"CSV":[47,58],"format":[48,59,70],"with":[49,60],"comma":[50],"separated":[51,62],"columns.":[52,63],"csv-semi-comma":[53],"semi-comma":[61],"html":[64],"HTML":[69],"ease":[72],"visualization":[74],"of":[75,86,112,247,353,427,467],"dataset.":[77,225,256,321,345,361],"sql":[78,109],"original":[81,178,224,274,284,304,344,360,368,394],"SQL":[82],"(schema":[83],"data)":[85],"used":[89,397],"this":[91],"study.":[92],"Each":[93,202],"compressed":[94],"directory":[95,110],"a":[97,241,291],"README":[98],"file":[99],"explaining":[100],"which":[101],"information":[102,120,389,403],"each":[103],"column":[104,193],"includes.":[105],"Overview":[107],"A.":[108],"consists":[111],"two":[113],"tables:":[114],"1.":[115],"The":[116,385,408],"table":[117,386],"tb_unique_bad_smell":[118],"we":[121,175,198,213,380,390,396,411],"collect":[122],"from":[123,238,342,358,392],"ChatGPT.":[124,201,233,383],"CREATE":[125],"TABLE":[126],"public.tb_unique_bad_smell":[127],"(":[128],"id_unique_bad_smell":[129],"integer":[130,172,371],"NOT":[131],"NULL,":[132],"id_bad_smell":[133],"bigint,":[134,136,162],"id_source_code":[135,170],"chat_gpt_response":[137],"text,":[138,140,142,144,152,154,160],"question":[139,190,203],"badsmell_base":[141],"bad_smell_gpt":[143,226],"found_any":[145],"boolean,":[146,148,150],"valid_bad_smell":[147],"bad_smell_in_base":[149],"bad_smell_not_in_the_base":[151],"bad_smell_not_found":[153,322],"index":[155],"integer,":[156,158],"index_base":[157,338],"url_github":[159],"id_base":[161,362],"dt_insertion":[163],"timestamp":[164],"without":[165],"time":[166],"zone,":[167],"nr_question":[168],"smallint);":[169],"identifier":[173],"when":[174],"imported":[176,341,391],"dataset":[179,285,331,395],"database.chat_gpt_response":[182],"ChatGPT's":[185,406],"response":[186],"prompts.":[189],"all":[195],"prompts":[197],"submitted":[199,381],"includes":[204],"prompt":[206,379],"under":[207],"evaluation":[208],"source":[211,355,469],"code":[212,219,228,356,449,458,470],"were":[214],"interested":[215],"evaluating.badsmell_base":[217],"smells":[220,229,237,249,281,297,311,328],"assigned":[221,420],"identified":[230],"by":[231,251,299],"extracted":[235,357],"these":[236],"`chat_gpt_response`.found_any":[239],"boolean":[242,292],"field":[243,278,293,308,325,365,372],"indicating":[244,294],"if":[245,260,268,295],"any":[246,265],"found":[250,298,314],"ChatGPT":[252,261,288,300,313,333,401],"are":[253,301,317],"In":[257],"other":[258],"words,":[259],"answered":[262],"yes,":[263],"finding":[264],"smell":[266,415,419,452,461],"(even":[267],"it":[269],"is":[270],"not":[271,318,335],"dataset).valid_bad_smell":[275],"text":[277,307,324],"containing":[279,309,326,373],"that":[286,312,332],"identified.bad_smell_in_base":[289],"dataset.bad_smell_not_in_the_base":[305],"they":[316],"did":[334],"detect.index":[336],"indexes":[340],"GitHub":[346,351,465],"provided":[347],"them.url_github":[348],"URL":[352,466],"id":[364],"dataset.nr_question":[369],"1":[374],"or":[375,436],"2,":[376],"identifying":[377],"2.":[384],"`tb_unique_source_code`":[387],"submit":[399],"evaluate":[405],"performance.":[407],"primary":[409],"relied":[412],"on":[413],"are:":[414],"presents":[417],"code.severity":[423],"severity":[426],"smells,":[429],"Major,":[430],"Critical,":[431],"Minor.":[432],"type":[433],"function":[435],"class.code_name":[437],"full":[440],"path":[441],"for":[442],"smell,":[444],"e.g.,":[445],"nm_package.nm_class.nm_methodstart_line":[446],"where":[450,459],"starts.end_line":[453],"line":[455],"ends.link":[462],"evaluated.":[471]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
