{"id":"https://openalex.org/W2740130862","doi":"https://doi.org/10.1145/3106237.3106290","title":"Are deep neural networks the best choice for modeling source code?","display_name":"Are deep neural networks the best choice for modeling source code?","publication_year":2017,"publication_date":"2017-08-02","ids":{"openalex":"https://openalex.org/W2740130862","doi":"https://doi.org/10.1145/3106237.3106290","mag":"2740130862"},"language":"en","primary_location":{"id":"doi:10.1145/3106237.3106290","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3106237.3106290","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2017 11th Joint Meeting on Foundations of Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009679905","display_name":"Vincent J. Hellendoorn","orcid":"https://orcid.org/0000-0001-7516-0525"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Vincent J. Hellendoorn","raw_affiliation_strings":["University of California at Davis, USA"],"affiliations":[{"raw_affiliation_string":"University of California at Davis, USA","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036744986","display_name":"Pr\u00e9mkumar D\u00e9vanbu","orcid":"https://orcid.org/0000-0002-4346-5276"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Premkumar Devanbu","raw_affiliation_strings":["University of California at Davis, USA"],"affiliations":[{"raw_affiliation_string":"University of California at Davis, USA","institution_ids":["https://openalex.org/I84218800"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5009679905"],"corresponding_institution_ids":["https://openalex.org/I84218800"],"apc_list":null,"apc_paid":null,"fwci":27.6167,"has_fulltext":false,"cited_by_count":295,"citation_normalized_percentile":{"value":0.99647932,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"763","last_page":"773"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8780660629272461},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.7034631371498108},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.701972484588623},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.6069674491882324},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5675197839736938},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5318984985351562},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5152021050453186},{"id":"https://openalex.org/keywords/locality-of-reference","display_name":"Locality of reference","score":0.5080060958862305},{"id":"https://openalex.org/keywords/codebase","display_name":"Codebase","score":0.4958837926387787},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.48434627056121826},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.416208416223526},{"id":"https://openalex.org/keywords/expansive","display_name":"Expansive","score":0.4108961820602417},{"id":"https://openalex.org/keywords/modeling-language","display_name":"Modeling language","score":0.41028571128845215},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.3807162344455719},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.37333011627197266},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3246469795703888},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.14231231808662415},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.10580459237098694}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8780660629272461},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.7034631371498108},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.701972484588623},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.6069674491882324},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5675197839736938},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5318984985351562},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5152021050453186},{"id":"https://openalex.org/C27602214","wikidata":"https://www.wikidata.org/wiki/Q1868547","display_name":"Locality of reference","level":3,"score":0.5080060958862305},{"id":"https://openalex.org/C51929080","wikidata":"https://www.wikidata.org/wiki/Q2425187","display_name":"Codebase","level":3,"score":0.4958837926387787},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.48434627056121826},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.416208416223526},{"id":"https://openalex.org/C2780502288","wikidata":"https://www.wikidata.org/wiki/Q28838156","display_name":"Expansive","level":3,"score":0.4108961820602417},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.41028571128845215},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.3807162344455719},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.37333011627197266},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3246469795703888},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.14231231808662415},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.10580459237098694},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C30407753","wikidata":"https://www.wikidata.org/wiki/Q186191","display_name":"Compressive strength","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3106237.3106290","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3106237.3106290","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2017 11th Joint Meeting on Foundations of Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8100000023841858}],"awards":[{"id":"https://openalex.org/G7432288113","display_name":null,"funder_award_id":"1414172","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W179875071","https://openalex.org/W1551431154","https://openalex.org/W1607229519","https://openalex.org/W1655078475","https://openalex.org/W1771830246","https://openalex.org/W1860267373","https://openalex.org/W1938755728","https://openalex.org/W1970607969","https://openalex.org/W1970859802","https://openalex.org/W1972141422","https://openalex.org/W1974020522","https://openalex.org/W1988346254","https://openalex.org/W1994573369","https://openalex.org/W2018389835","https://openalex.org/W2060384944","https://openalex.org/W2064675550","https://openalex.org/W2066714497","https://openalex.org/W2074032109","https://openalex.org/W2083878868","https://openalex.org/W2097927681","https://openalex.org/W2108321481","https://openalex.org/W2125031621","https://openalex.org/W2140609933","https://openalex.org/W2142403498","https://openalex.org/W2143861926","https://openalex.org/W2148190602","https://openalex.org/W2165747537","https://openalex.org/W2166597811","https://openalex.org/W2175297521","https://openalex.org/W2257123346","https://openalex.org/W2259472270","https://openalex.org/W2444132761","https://openalex.org/W2511803001","https://openalex.org/W2547880329","https://openalex.org/W2949237929","https://openalex.org/W2950186769","https://openalex.org/W2951714314","https://openalex.org/W3005855585","https://openalex.org/W3021713638","https://openalex.org/W3104874136","https://openalex.org/W4247610018","https://openalex.org/W4247950230","https://openalex.org/W4300925921","https://openalex.org/W6607333740"],"related_works":["https://openalex.org/W2250909759","https://openalex.org/W2532616038","https://openalex.org/W2624072012","https://openalex.org/W2787311093","https://openalex.org/W2057384730","https://openalex.org/W4307474317","https://openalex.org/W2008468404","https://openalex.org/W2147879411","https://openalex.org/W2132221452","https://openalex.org/W2081295016"],"abstract_inverted_index":{"Current":[0],"statistical":[1],"language":[2,40,68,137],"modeling":[3,41,49,69,117],"techniques,":[4],"including":[5],"deep-learning":[6,136,169],"based":[7,168],"models,":[8,138],"have":[9],"proven":[10],"to":[11,43,78,113],"be":[12,29,114],"quite":[13],"effective":[14],"for":[15,31,73,116,145,156],"source":[16,26,50,143,157],"code.":[17],"We":[18,63,119],"argue":[19],"here":[20],"that":[21,110,151,162],"the":[22,45,76],"special":[23,46],"properties":[24],"of":[25,48,108],"code":[27,144,158],"can":[28,159],"exploited":[30],"further":[32],"improvements.":[33],"In":[34],"this":[35],"work,":[36],"we":[37,91,111],"enhance":[38],"established":[39],"approaches":[42],"handle":[44],"challenges":[47],"code,":[51],"such":[52],"as:":[53],"frequent":[54],"changes,":[55],"larger,":[56],"changing":[57],"vocabularies,":[58],"deeply":[59],"nested":[60,67],"scopes,":[61],"etc.":[62],"present":[64,98,120],"a":[65,99,102],"fast,":[66],"toolkit":[70],"specifically":[71],"designed":[72],"software,":[74],"with":[75,101,127],"ability":[77],"add":[79],"&":[80,85],"remove":[81],"text,":[82],"and":[83,97,134,139,166],"mix":[84],"swap":[86],"out":[87],"many":[88],"models.":[89,170],"Specifically,":[90],"improve":[92],"upon":[93],"prior":[94],"cache-modeling":[95],"work":[96],"model":[100],"much":[103],"more":[104],"expansive,":[105],"multi-level":[106],"notion":[107],"locality":[109],"show":[112],"well-suited":[115],"software.":[118],"results":[121],"on":[122],"varying":[123],"corpora":[124],"in":[125],"comparison":[126],"traditional":[128],"N-gram,":[129],"as":[130,132],"well":[131],"RNN,":[133],"LSTM":[135,167],"release":[140],"all":[141],"our":[142],"public":[146],"use.":[147],"Our":[148],"evaluations":[149],"suggest":[150],"carefully":[152],"adapting":[153],"N-gram":[154],"models":[155],"yield":[160],"performance":[161],"surpasses":[163],"even":[164],"RNN":[165]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":24},{"year":2023,"cited_by_count":32},{"year":2022,"cited_by_count":33},{"year":2021,"cited_by_count":55},{"year":2020,"cited_by_count":59},{"year":2019,"cited_by_count":49},{"year":2018,"cited_by_count":22},{"year":2017,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
