{"id":"https://openalex.org/W4315706637","doi":"https://doi.org/10.48550/arxiv.2301.03988","title":"SantaCoder: don't reach for the stars!","display_name":"SantaCoder: don't reach for the stars!","publication_year":2023,"publication_date":"2023-01-09","ids":{"openalex":"https://openalex.org/W4315706637","doi":"https://doi.org/10.48550/arxiv.2301.03988"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2301.03988","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.03988","pdf_url":"https://arxiv.org/pdf/2301.03988","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2301.03988","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072906919","display_name":"Loubna Ben Allal","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Allal, Loubna Ben","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009823475","display_name":"Raymond Li","orcid":"https://orcid.org/0000-0002-7957-7798"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Raymond","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068788224","display_name":"Denis Kocetkov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kocetkov, Denis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002251783","display_name":"Chenghao Mou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mou, Chenghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033794353","display_name":"Christopher Akiki","orcid":"https://orcid.org/0000-0002-1634-5068"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akiki, Christopher","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029389486","display_name":"Carlos Munoz Ferrandis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ferrandis, Carlos Munoz","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000043237","display_name":"Niklas Muennighoff","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muennighoff, Niklas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101511088","display_name":"Mayank Mishra","orcid":"https://orcid.org/0000-0001-8964-4133"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mishra, Mayank","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007842855","display_name":"Alex Gu","orcid":"https://orcid.org/0000-0002-4814-0796"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Alex","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070647299","display_name":"Manan Dey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dey, Manan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090893148","display_name":"Logesh Kumar Umapathi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Umapathi, Logesh Kumar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075492610","display_name":"Carolyn Jane Anderson","orcid":"https://orcid.org/0000-0001-5717-4210"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anderson, Carolyn Jane","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018675797","display_name":"Yangtian Zi","orcid":"https://orcid.org/0000-0003-2606-3280"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zi, Yangtian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005743381","display_name":"Joel Lamy Poirier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Poirier, Joel Lamy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083384339","display_name":"Hailey Schoelkopf","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schoelkopf, Hailey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091564502","display_name":"Sergey Troshin","orcid":"https://orcid.org/0000-0001-5493-1773"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Troshin, Sergey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063189132","display_name":"Dmitry Abulkhanov","orcid":"https://orcid.org/0000-0002-8758-2458"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abulkhanov, Dmitry","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001782949","display_name":"Manuel Romero","orcid":"https://orcid.org/0000-0001-8152-1331"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Romero, Manuel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077804559","display_name":"Michael F. L\u00e4ppert","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lappert, Michael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054948010","display_name":"Francesco De Toni","orcid":"https://orcid.org/0000-0003-0062-7674"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"De Toni, Francesco","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088568785","display_name":"Bernardo Garc\u00eda del R\u00edo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"del R\u00edo, Bernardo Garc\u00eda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100318540","display_name":"Qian Liu","orcid":"https://orcid.org/0000-0002-0517-7687"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Qian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110946701","display_name":"Shamik Bose","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bose, Shamik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018410563","display_name":"Urvashi Bhattacharyya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhattacharyya, Urvashi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082624117","display_name":"Terry Yue Zhuo","orcid":"https://orcid.org/0000-0002-5760-5188"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhuo, Terry Yue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035649010","display_name":"Ian Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Ian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077190748","display_name":"Paulo Villegas","orcid":"https://orcid.org/0000-0001-9293-8052"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Villegas, Paulo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076596867","display_name":"Marco Zocca","orcid":"https://orcid.org/0000-0001-5210-9794"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zocca, Marco","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048579807","display_name":"Sourab Mangrulkar","orcid":"https://orcid.org/0000-0002-7997-1170"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mangrulkar, Sourab","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071825886","display_name":"David Lansky","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lansky, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044824055","display_name":"Huu Du Nguyen","orcid":"https://orcid.org/0000-0001-6067-6676"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Huu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082114795","display_name":"Danish Contractor","orcid":"https://orcid.org/0000-0002-6843-1961"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Contractor, Danish","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108457098","display_name":"L. F. Villa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Villa, Luis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100405693","display_name":"Jia Li","orcid":"https://orcid.org/0000-0002-5579-8852"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010465328","display_name":"Dzmitry Bahdanau","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bahdanau, Dzmitry","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000126238","display_name":"Yacine Jernite","orcid":"https://orcid.org/0000-0002-8053-6862"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jernite, Yacine","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085873515","display_name":"Sean Hughes","orcid":"https://orcid.org/0000-0002-2264-8479"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hughes, Sean","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003637850","display_name":"Daniel Fried","orcid":"https://orcid.org/0000-0002-5327-2558"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fried, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044042294","display_name":"Arjun Guha","orcid":"https://orcid.org/0000-0002-7493-3271"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guha, Arjun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103854790","display_name":"Harm de Vries","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Vries, Harm","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5008355834","display_name":"Leandro von Werra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"von Werra, Leandro","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":41,"corresponding_author_ids":["https://openalex.org/A5072906919"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":51,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.983299970626831,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9532999992370605,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7761378288269043},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.752582848072052},{"id":"https://openalex.org/keywords/javascript","display_name":"JavaScript","score":0.687254786491394},{"id":"https://openalex.org/keywords/java","display_name":"Java","score":0.6054698824882507},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.5446630120277405},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.5235511660575867},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4834750294685364},{"id":"https://openalex.org/keywords/web-application","display_name":"Web application","score":0.4593402147293091},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4533802568912506},{"id":"https://openalex.org/keywords/open-source","display_name":"Open source","score":0.42897987365722656},{"id":"https://openalex.org/keywords/license","display_name":"License","score":0.4216834604740143},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3607594966888428},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35033586621284485},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.31166213750839233},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.1280900537967682}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7761378288269043},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.752582848072052},{"id":"https://openalex.org/C544833334","wikidata":"https://www.wikidata.org/wiki/Q2005","display_name":"JavaScript","level":2,"score":0.687254786491394},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.6054698824882507},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.5446630120277405},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.5235511660575867},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4834750294685364},{"id":"https://openalex.org/C118643609","wikidata":"https://www.wikidata.org/wiki/Q189210","display_name":"Web application","level":2,"score":0.4593402147293091},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4533802568912506},{"id":"https://openalex.org/C3018397939","wikidata":"https://www.wikidata.org/wiki/Q3644502","display_name":"Open source","level":3,"score":0.42897987365722656},{"id":"https://openalex.org/C2780560020","wikidata":"https://www.wikidata.org/wiki/Q79719","display_name":"License","level":2,"score":0.4216834604740143},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3607594966888428},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35033586621284485},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.31166213750839233},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.1280900537967682}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2301.03988","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.03988","pdf_url":"https://arxiv.org/pdf/2301.03988","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2301.03988","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2301.03988","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2301.03988","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.03988","pdf_url":"https://arxiv.org/pdf/2301.03988","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4315706637.pdf","grobid_xml":"https://content.openalex.org/works/W4315706637.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3080200277","https://openalex.org/W2557718140","https://openalex.org/W67092138","https://openalex.org/W4225687299","https://openalex.org/W2789551765","https://openalex.org/W2113128227","https://openalex.org/W632256878","https://openalex.org/W2491403535","https://openalex.org/W2479811461","https://openalex.org/W2104915799"],"abstract_inverted_index":{"The":[0,74],"BigCode":[1],"project":[2],"is":[3],"an":[4,149],"open-scientific":[5],"collaboration":[6,26],"working":[7],"on":[8,66,79,129],"the":[9,22,25,31,35,42,47,51,58,67,80,130],"responsible":[10],"development":[11],"of":[12,24,34,73,90,136],"large":[13],"language":[14],"models":[15,65,119,145],"for":[16,57],"code.":[17],"This":[18],"tech":[19],"report":[20],"describes":[21],"progress":[23],"until":[27],"December":[28],"2022,":[29],"outlining":[30],"current":[32],"state":[33],"Personally":[36],"Identifiable":[37],"Information":[38],"(PII)":[39],"redaction":[40],"pipeline,":[41],"experiments":[43,52],"conducted":[44],"to":[45],"de-risk":[46],"model":[48,112],"architecture,":[49],"and":[50,70,76,121,127,133],"investigating":[53],"better":[54],"preprocessing":[55],"methods":[56],"training":[59],"data.":[60],"We":[61,84],"train":[62],"1.1B":[63],"parameter":[64],"Java,":[68,131],"JavaScript,":[69,132],"Python":[71,134],"subsets":[72],"Stack":[75],"evaluate":[77],"them":[78],"MultiPL-E":[81],"text-to-code":[82],"benchmark.":[83],"find":[85],"that":[86,98],"more":[87],"aggressive":[88],"filtering":[89],"near-duplicates":[91],"can":[92],"further":[93],"boost":[94],"performance":[95,108],"and,":[96],"surprisingly,":[97],"selecting":[99],"files":[100],"from":[101],"repositories":[102],"with":[103],"5+":[104],"GitHub":[105],"stars":[106],"deteriorates":[107],"significantly.":[109],"Our":[110],"best":[111],"outperforms":[113],"previous":[114],"open-source":[115],"multilingual":[116],"code":[117],"generation":[118,126],"(InCoder-6.7B":[120],"CodeGen-Multi-2.7B)":[122],"in":[123],"both":[124],"left-to-right":[125],"infilling":[128],"portions":[135],"MultiPL-E,":[137],"despite":[138],"being":[139],"a":[140],"substantially":[141],"smaller":[142],"model.":[143],"All":[144],"are":[146],"released":[147],"under":[148],"OpenRAIL":[150],"license":[151],"at":[152],"https://hf.co/bigcode.":[153]},"counts_by_year":[{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":23},{"year":2023,"cited_by_count":17}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
