{"id":"https://openalex.org/W4389163154","doi":"https://doi.org/10.1145/3611643.3616244","title":"On the Usage of Continual Learning for Out-of-Distribution Generalization in Pre-trained Language Models of Code","display_name":"On the Usage of Continual Learning for Out-of-Distribution Generalization in Pre-trained Language Models of Code","publication_year":2023,"publication_date":"2023-11-30","ids":{"openalex":"https://openalex.org/W4389163154","doi":"https://doi.org/10.1145/3611643.3616244"},"language":"en","primary_location":{"id":"doi:10.1145/3611643.3616244","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3611643.3616244","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107246651","display_name":"Martin Weyssow","orcid":"https://orcid.org/0000-0002-5987-850X"},"institutions":[{"id":"https://openalex.org/I70931966","display_name":"Universit\u00e9 de Montr\u00e9al","ror":"https://ror.org/0161xgx34","country_code":"CA","type":"education","lineage":["https://openalex.org/I70931966"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Martin Weyssow","raw_affiliation_strings":["Universit\u00e9 de Montr\u00e9al, Montreal, Canada"],"raw_orcid":"https://orcid.org/0000-0002-5987-850X","affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Montr\u00e9al, Montreal, Canada","institution_ids":["https://openalex.org/I70931966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100424233","display_name":"Xin Zhou","orcid":"https://orcid.org/0000-0002-4558-0622"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xin Zhou","raw_affiliation_strings":["Singapore Management University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-4558-0622","affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074029092","display_name":"Kisub Kim","orcid":"https://orcid.org/0000-0002-4462-6916"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Kisub Kim","raw_affiliation_strings":["Singapore Management University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-4462-6916","affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081036622","display_name":"David Lo","orcid":"https://orcid.org/0000-0002-4367-7201"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"David Lo","raw_affiliation_strings":["Singapore Management University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-4367-7201","affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009574640","display_name":"Houari Sahraoui","orcid":"https://orcid.org/0000-0001-6304-9926"},"institutions":[{"id":"https://openalex.org/I70931966","display_name":"Universit\u00e9 de Montr\u00e9al","ror":"https://ror.org/0161xgx34","country_code":"CA","type":"education","lineage":["https://openalex.org/I70931966"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Houari Sahraoui","raw_affiliation_strings":["Universit\u00e9 de Montr\u00e9al, Montreal, Canada"],"raw_orcid":"https://orcid.org/0000-0001-6304-9926","affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Montr\u00e9al, Montreal, Canada","institution_ids":["https://openalex.org/I70931966"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5107246651"],"corresponding_institution_ids":["https://openalex.org/I70931966"],"apc_list":null,"apc_paid":null,"fwci":1.5337,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.86581933,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1470","last_page":"1482"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9625999927520752,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8630715012550354},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6642400622367859},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5450419187545776},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.504546046257019},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4970403015613556},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4943251609802246},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.47802767157554626},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.47642573714256287},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4136325716972351},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.19397133588790894}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8630715012550354},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6642400622367859},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5450419187545776},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.504546046257019},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4970403015613556},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4943251609802246},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.47802767157554626},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.47642573714256287},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4136325716972351},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.19397133588790894},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3611643.3616244","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3611643.3616244","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.49000000953674316,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320334841","display_name":"Fonds de recherche du Qu\u00e9bec \u2013 Nature et technologies","ror":"https://ror.org/00b9f9778"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1682403713","https://openalex.org/W2022775778","https://openalex.org/W2059215200","https://openalex.org/W2135742552","https://openalex.org/W2247374552","https://openalex.org/W2473930607","https://openalex.org/W2509810107","https://openalex.org/W2560647685","https://openalex.org/W2786446225","https://openalex.org/W2788388592","https://openalex.org/W2954451301","https://openalex.org/W2963588172","https://openalex.org/W2963846996","https://openalex.org/W2965373594","https://openalex.org/W2979792666","https://openalex.org/W2979826702","https://openalex.org/W2990138404","https://openalex.org/W3000135256","https://openalex.org/W3011013751","https://openalex.org/W3035342403","https://openalex.org/W3084812981","https://openalex.org/W3097816393","https://openalex.org/W3098511564","https://openalex.org/W3102015031","https://openalex.org/W3105867435","https://openalex.org/W3144723458","https://openalex.org/W3145293720","https://openalex.org/W3160765131","https://openalex.org/W3176740355","https://openalex.org/W3217001695","https://openalex.org/W4224441980","https://openalex.org/W4225484930","https://openalex.org/W4281763794","https://openalex.org/W4285490465","https://openalex.org/W4288055447","https://openalex.org/W4319653845","https://openalex.org/W4385570151","https://openalex.org/W4385572001","https://openalex.org/W6785333560","https://openalex.org/W6950217568"],"related_works":["https://openalex.org/W4390516098","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2142795561","https://openalex.org/W4205302943","https://openalex.org/W2770593030","https://openalex.org/W2561132942","https://openalex.org/W3154990682","https://openalex.org/W3155418658","https://openalex.org/W3081644756"],"abstract_inverted_index":{"Pre-trained":[0],"language":[1],"models":[2],"(PLMs)":[3],"have":[4],"become":[5],"a":[6,15,30,43,75,104,125,136,143,152,170,174],"prevalent":[7],"technique":[8,195],"in":[9,29,74,111,124,248],"deep":[10],"learning":[11,229],"for":[12,91],"code,":[13],"utilizing":[14,240],"two-stage":[16],"pre-training":[17,66],"and":[18,27,48,67,173,183,233],"fine-tuning":[19,129,194],"procedure":[20],"to":[21,45,58,96,120,135,149,203,211],"acquire":[22],"general":[23],"knowledge":[24,217],"about":[25],"code":[26,95],"specialize":[28],"variety":[31],"of":[32,39,50,64,77,94,116,154,208,214],"downstream":[33,82,179,252],"tasks.":[34,83],"However,":[35],"the":[36,46,62,65,78,89,122,146,190,205,212],"dynamic":[37,206],"nature":[38,207],"software":[40,97,137],"codebases":[41],"poses":[42],"challenge":[44],"effectiveness":[47],"robustness":[49],"PLMs.":[51],"In":[52,84],"particular,":[53],"world-realistic":[54],"scenarios":[55],"potentially":[56],"lead":[57],"significant":[59],"differences":[60],"between":[61],"distribution":[63,71,100],"test":[68],"data,":[69],"i.e.,":[70,169,218],"shift,":[72],"resulting":[73],"degradation":[76],"PLM's":[79],"performance":[80],"on":[81,177],"this":[85,117],"paper,":[86],"we":[87,141,225],"stress":[88],"need":[90],"adapting":[92],"PLMs":[93,249],"data":[98,130],"whose":[99],"changes":[101],"over":[102,132,160],"time,":[103],"crucial":[105],"problem":[106],"that":[107,189,239],"has":[108],"been":[109],"overlooked":[110],"previous":[112],"works.":[113],"The":[114],"motivation":[115],"work":[118,198],"is":[119,199],"consider":[121],"PLM":[123,167],"non-stationary":[126],"environment,":[127],"where":[128,145],"evolves":[131],"time":[133],"according":[134],"evolution":[138],"scenario.":[139],"Specifically,":[140],"design":[142],"scenario":[144],"model":[147],"needs":[148],"learn":[150],"from":[151,196],"stream":[153],"programs":[155],"containing":[156],"new,":[157],"unseen":[158],"APIs":[159],"time.":[161],"We":[162,187],"study":[163],"two":[164,178],"widely":[165],"used":[166,193],"architectures,":[168],"GPT2":[171],"decoder":[172],"RoBERTa":[175],"encoder,":[176],"tasks,":[180],"API":[181,184],"call":[182],"usage":[185],"prediction.":[186],"demonstrate":[188,238],"most":[191],"commonly":[192],"prior":[197],"not":[200],"robust":[201],"enough":[202],"handle":[204],"APIs,":[209],"leading":[210],"loss":[213],"previously":[215],"acquired":[216],"catastrophic":[219,246],"forgetting.":[220],"To":[221],"address":[222],"these":[223,241],"issues,":[224],"implement":[226],"five":[227],"continual":[228],"approaches,":[230],"including":[231],"replay-based":[232],"regularization-based":[234],"methods.":[235],"Our":[236],"findings":[237],"straightforward":[242],"methods":[243],"effectively":[244],"mitigates":[245],"forgetting":[247],"across":[250],"both":[251],"tasks":[253],"while":[254],"achieving":[255],"comparable":[256],"or":[257],"superior":[258],"performance.":[259]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
