{"id":"https://openalex.org/W4409797602","doi":"https://doi.org/10.1145/3731753","title":"Ecosystem of Large Language Models for Code","display_name":"Ecosystem of Large Language Models for Code","publication_year":2025,"publication_date":"2025-04-25","ids":{"openalex":"https://openalex.org/W4409797602","doi":"https://doi.org/10.1145/3731753"},"language":"en","primary_location":{"id":"doi:10.1145/3731753","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731753","pdf_url":null,"source":{"id":"https://openalex.org/S142627899","display_name":"ACM Transactions on Software Engineering and Methodology","issn_l":"1049-331X","issn":["1049-331X","1557-7392"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Software Engineering and Methodology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008695791","display_name":"Zhou Yang","orcid":"https://orcid.org/0000-0001-5938-1918"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Zhou Yang","raw_affiliation_strings":["Singapore Management University, Singapore, Singapore","Singapore Management University, Singapore"],"affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore, Singapore","institution_ids":["https://openalex.org/I79891267"]},{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002667771","display_name":"Jieke Shi","orcid":"https://orcid.org/0000-0002-0799-5018"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jieke Shi","raw_affiliation_strings":["Singapore Management University, Singapore, Singapore","Singapore Management University, Singapore"],"affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore, Singapore","institution_ids":["https://openalex.org/I79891267"]},{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036744986","display_name":"Pr\u00e9mkumar D\u00e9vanbu","orcid":"https://orcid.org/0000-0002-4346-5276"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Premkumar Devanbu","raw_affiliation_strings":["UC Davis, Davis, California, USA","Department of Computer Science, UC Davis, USA"],"affiliations":[{"raw_affiliation_string":"UC Davis, Davis, California, USA","institution_ids":["https://openalex.org/I84218800"]},{"raw_affiliation_string":"Department of Computer Science, UC Davis, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081036622","display_name":"David Lo","orcid":"https://orcid.org/0000-0002-4367-7201"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"David Lo","raw_affiliation_strings":["Singapore Management University, Singapore, Singapore","Singapore Management University, Singapore"],"affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore, Singapore","institution_ids":["https://openalex.org/I79891267"]},{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5008695791"],"corresponding_institution_ids":["https://openalex.org/I79891267"],"apc_list":null,"apc_paid":null,"fwci":24.4706,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.99327527,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"35","issue":"1","first_page":"1","last_page":"30"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7730648517608643},{"id":"https://openalex.org/keywords/ecosystem","display_name":"Ecosystem","score":0.5554350018501282},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5019981861114502},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.34842944145202637},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.28661733865737915}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7730648517608643},{"id":"https://openalex.org/C110872660","wikidata":"https://www.wikidata.org/wiki/Q37813","display_name":"Ecosystem","level":2,"score":0.5554350018501282},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5019981861114502},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.34842944145202637},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.28661733865737915},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3731753","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731753","pdf_url":null,"source":{"id":"https://openalex.org/S142627899","display_name":"ACM Transactions on Software Engineering and Methodology","issn_l":"1049-331X","issn":["1049-331X","1557-7392"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Software Engineering and Methodology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W950821216","https://openalex.org/W1975675278","https://openalex.org/W1988691616","https://openalex.org/W2019955851","https://openalex.org/W2107142491","https://openalex.org/W2163004671","https://openalex.org/W2605856244","https://openalex.org/W2795081714","https://openalex.org/W2963889172","https://openalex.org/W2979792666","https://openalex.org/W3091065534","https://openalex.org/W3092232764","https://openalex.org/W3109966548","https://openalex.org/W3120545963","https://openalex.org/W3161331107","https://openalex.org/W3162867182","https://openalex.org/W3162945305","https://openalex.org/W4220722393","https://openalex.org/W4221145571","https://openalex.org/W4285209474","https://openalex.org/W4288079288","https://openalex.org/W4308562533","https://openalex.org/W4308627220","https://openalex.org/W4308641647","https://openalex.org/W4312044266","https://openalex.org/W4313547593","https://openalex.org/W4376606615","https://openalex.org/W4376606832","https://openalex.org/W4384009684","https://openalex.org/W4384009685","https://openalex.org/W4384345640","https://openalex.org/W4385564894","https://openalex.org/W4386114095","https://openalex.org/W4388115877","https://openalex.org/W4388483038","https://openalex.org/W4388483294","https://openalex.org/W4389208909","https://openalex.org/W4390874818","https://openalex.org/W4391696889","https://openalex.org/W4399397061","https://openalex.org/W4399513333","https://openalex.org/W4399631748","https://openalex.org/W4399667996","https://openalex.org/W4399871912","https://openalex.org/W4400681445","https://openalex.org/W4401455417","https://openalex.org/W4402665833","https://openalex.org/W4403413448","https://openalex.org/W4403761251","https://openalex.org/W4405366282","https://openalex.org/W4405640497","https://openalex.org/W4406688098"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"The":[0,175],"extensive":[1],"availability":[2],"of":[3,25,64,87,169,204,276],"publicly":[4],"accessible":[5],"source":[6],"code":[7,30],"and":[8,43,89,102,107,111,124,150,157,186,211,230,244,269],"the":[9,65,105,126,141,196,202,213,242,249,257,267,273],"advances":[10],"in":[11,37,104,209],"language":[12,27],"models,":[13,101],"coupled":[14],"with":[15,45,140,221,227,234,254],"increasing":[16],"computational":[17],"resources,":[18],"have":[19],"led":[20],"to":[21,59,119,207,240,271],"a":[22,49,61,85],"remarkable":[23],"rise":[24],"large":[26],"models":[28,33,90,226],"for":[29,76,128],"(LLM4Code).":[31],"These":[32],"do":[34],"not":[35],"exist":[36],"isolation":[38],"but":[39],"rather":[40],"depend":[41],"on":[42,92,173,262],"interact":[44],"each":[46,116],"other,":[47],"forming":[48],"complex":[50],"ecosystem":[51,67,106,243],"that":[52,161,168,246],"is":[53,164,179],"worth":[54],"studying.":[55],"It":[56],"motivates":[57],"us":[58],"introduce":[60],"pioneering":[62],"analysis":[63],"LLM4Code":[66,134,162,220],".":[68,152],"Utilizing":[69],"Hugging":[70],"Face":[71],"[":[72],"]\u2014the":[73],"premier":[74],"hub":[75],"transformer-based":[77],"models\u2014as":[78],"our":[79,263],"primary":[80],"source,":[81],"we":[82,154,187,200,265],"manually":[83,250],"curate":[84],"list":[86],"datasets":[88],"focused":[91],"software":[93,184],"engineering":[94],"tasks.":[95],"We":[96,113,132,237],"first":[97],"identify":[98,219],"key":[99],"datasets,":[100],"users":[103],"quantify":[108],"their":[109],"contributions":[110],"importance.":[112],"then":[114],"examine":[115,155],"model\u2019s":[117],"documentation":[118,156,163],"trace":[120],"its":[121],"base":[122,225],"model":[123,135],"understand":[125],"process":[127],"deriving":[129],"new":[130],"models.":[131],"categorize":[133],"reuse":[136,232],"into":[137],"nine":[138],"categories,":[139],"top":[142],"three":[143],"being":[144],"fine-tuning":[145],",":[146,149],"architecture":[147],"sharing":[148],"quantization":[151],"Additionally,":[153],"licensing":[158],"practices,":[159],"revealing":[160],"less":[165],"detailed":[166],"than":[167],"general":[170],"AI":[171],"repositories":[172],"GitHub.":[174],"license":[176,191],"usage":[177],"pattern":[178],"also":[180],"different":[181],"from":[182,217,248,256],"other":[183],"repositories,":[185],"further":[188],"analyze":[189,195],"potential":[190,203],"incompatibility":[192],"issues.":[193],"To":[194],"rapidly":[197],"growing":[198],"LLM4Code,":[199],"explore":[201],"using":[205],"LLMs":[206,216,239],"assist":[208],"constructing":[210],"analyzing":[212],"ecosystem.":[214],"Advanced":[215],"OpenAI":[218],"98%":[222],"accuracy,":[223,229],"infer":[224],"87%":[228],"predict":[231],"types":[233],"89%":[235],"accuracy.":[236],"employ":[238],"expand":[241],"find":[245],"conclusions":[247],"curated":[251],"dataset":[252],"align":[253],"those":[255],"automatically":[258],"created":[259],"one.":[260],"Based":[261],"findings,":[264],"discuss":[266],"implications":[268],"suggestions":[270],"facilitate":[272],"healthy":[274],"growth":[275],"LLM4Code.":[277]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":2}],"updated_date":"2025-12-12T23:16:27.785689","created_date":"2025-10-10T00:00:00"}
