{"id":"https://openalex.org/W4414230443","doi":"https://doi.org/10.1109/tse.2025.3609876","title":"An Empirical Study of Exploring the Capabilities of Large Language Models in Code Learning","display_name":"An Empirical Study of Exploring the Capabilities of Large Language Models in Code Learning","publication_year":2025,"publication_date":"2025-09-16","ids":{"openalex":"https://openalex.org/W4414230443","doi":"https://doi.org/10.1109/tse.2025.3609876"},"language":"en","primary_location":{"id":"doi:10.1109/tse.2025.3609876","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tse.2025.3609876","pdf_url":null,"source":{"id":"https://openalex.org/S8351582","display_name":"IEEE Transactions on Software Engineering","issn_l":"0098-5589","issn":["0098-5589","1939-3520","2326-3881"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Software Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Shangqing Liu","orcid":"https://orcid.org/0000-0002-5598-4006"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shangqing Liu","raw_affiliation_strings":["State Key Laboratory of Novel Software Technology, Nanjing University, Nanjing, China","Nanjing University, China"],"raw_orcid":"https://orcid.org/0000-0002-5598-4006","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]},{"raw_affiliation_string":"Nanjing University, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060364305","display_name":"Daya Guo","orcid":"https://orcid.org/0009-0008-0822-1517"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Daya Guo","raw_affiliation_strings":["SUN YAT-SEN University, Guangzhou, China","SUN YAT-SEN University, China"],"raw_orcid":"https://orcid.org/0009-0008-0822-1517","affiliations":[{"raw_affiliation_string":"SUN YAT-SEN University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]},{"raw_affiliation_string":"SUN YAT-SEN University, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jian Zhang","orcid":"https://orcid.org/0000-0001-8316-1894"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jian Zhang","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-8316-1894","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057849611","display_name":"Wei Ma","orcid":"https://orcid.org/0000-0002-0044-466X"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]},{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Wei Ma","raw_affiliation_strings":["Singapore Management University, Singapore","Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-0044-466X","affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]},{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102015751","display_name":"Yanzhou Li","orcid":"https://orcid.org/0009-0008-2263-7383"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yanzhou Li","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0009-0008-2263-7383","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100355692","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0001-7300-9215"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-7300-9215","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":2.1733,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.90403984,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"51","issue":"11","first_page":"3088","last_page":"3102"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9437000155448914,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9437000155448914,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/syntax","display_name":"Syntax","score":0.5306000113487244},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.49540001153945923},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4537999927997589},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4113999903202057},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.38269999623298645},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.3391999900341034},{"id":"https://openalex.org/keywords/code-review","display_name":"Code review","score":0.33390000462532043},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.3310000002384186}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7950999736785889},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.5306000113487244},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.49540001153945923},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4537999927997589},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.42910000681877136},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4113999903202057},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.38269999623298645},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.373199999332428},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3637000024318695},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.3391999900341034},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.33390000462532043},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.3310000002384186},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.33090001344680786},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.31299999356269836},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3102000057697296},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.30889999866485596},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.3068000078201294},{"id":"https://openalex.org/C114408938","wikidata":"https://www.wikidata.org/wiki/Q333373","display_name":"Abstract syntax","level":3,"score":0.29840001463890076},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.2930000126361847},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.27730000019073486},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.25369998812675476},{"id":"https://openalex.org/C2777601897","wikidata":"https://www.wikidata.org/wiki/Q3409113","display_name":"Presentation (obstetrics)","level":2,"score":0.2533000111579895},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tse.2025.3609876","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tse.2025.3609876","pdf_url":null,"source":{"id":"https://openalex.org/S8351582","display_name":"IEEE Transactions on Software Engineering","issn_l":"0098-5589","issn":["0098-5589","1939-3520","2326-3881"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Software Engineering","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/208755","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/208755","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W2065053490","https://openalex.org/W2142112143","https://openalex.org/W2148190602","https://openalex.org/W2282866165","https://openalex.org/W2955426500","https://openalex.org/W2962936887","https://openalex.org/W3014339000","https://openalex.org/W3022049116","https://openalex.org/W3034999214","https://openalex.org/W3098605233","https://openalex.org/W3108032709","https://openalex.org/W3174770825","https://openalex.org/W3176015924","https://openalex.org/W3177323791","https://openalex.org/W4205371973","https://openalex.org/W4205596491","https://openalex.org/W4205991051","https://openalex.org/W4221166942","https://openalex.org/W4252326246","https://openalex.org/W4284710241","https://openalex.org/W4311887664","https://openalex.org/W4313549837","https://openalex.org/W4384302803","https://openalex.org/W4385570973","https://openalex.org/W4385572925","https://openalex.org/W4385573867","https://openalex.org/W4386187806","https://openalex.org/W4388212670","https://openalex.org/W4388483108","https://openalex.org/W4389524426","https://openalex.org/W4396773582","https://openalex.org/W4400681808","https://openalex.org/W4402457546","https://openalex.org/W4403536352","https://openalex.org/W4406688098","https://openalex.org/W4412887834"],"related_works":[],"abstract_inverted_index":{"Since":[0],"the":[1,58,80,158,178,200,213,218],"advent":[2],"of":[3,34,60,126,160],"ChatGPT,":[4],"large":[5,72],"language":[6,73],"models":[7,142,240],"(LLMs)":[8],"have":[9,18],"attracted":[10],"widespread":[11],"attention":[12,187],"from":[13,88],"academia":[14],"and":[15,77,83,101],"industry.":[16],"They":[17],"also":[19],"brought":[20],"significant":[21],"changes":[22],"to":[23,56,109,168,211],"software":[24,64,106],"engineering.":[25],"However,":[26],"until":[27],"now,":[28],"there":[29],"has":[30],"been":[31],"a":[32,51,208,259],"lack":[33],"comprehensive":[35],"studies":[36],"comparing":[37],"LLMs":[38,61,111,145,206,226,232,265],"with":[39,112,138,172,185],"previous":[40,113,139,237],"smaller":[41,140],"code":[42,92,95,114,153,165,238,242,252,283],"pre-trained":[43,115,141,239],"models.":[44,116,284],"To":[45],"address":[46],"this":[47,54],"gap,":[48],"we":[49,68],"conduct":[50],"study":[52,85],"in":[53,62,149,177,193,217,250,266,279],"paper":[55],"illustrate":[57],"performance":[59,103,235],"different":[63,105],"engineering":[65,107],"tasks.":[66,269],"Specifically,":[67],"select":[69],"three":[70],"open-source":[71],"models,":[74],"CodeGen,":[75],"LLaMA,":[76],"StarCoder,":[78],"for":[79,104,128,227,264],"research":[81],"targets,":[82],"our":[84],"is":[86],"conducted":[87],"four":[89],"aspects,":[90],"including":[91],"syntax":[93,154],"understanding,":[94],"semantic":[96,173],"reasoning,":[97],"encoding":[98],"representation":[99,203,216],"quality,":[100],"adaptation":[102],"tasks":[108,229,244],"compare":[110],"Four":[117],"aspects":[118],"build":[119],"on":[120,241],"each":[121],"other,":[122],"forming":[123],"important":[124],"components":[125],"AI":[127],"Software":[129],"Engineering.":[130],"<p":[131],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[132],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">We":[133],"conclude":[134],"that:":[135],"(1)":[136],"Compared":[137],"like":[143],"CodeBERT,":[144],"exhibit":[146],"distinct":[147],"trends":[148],"how":[150],"they":[151],"learn":[152],"or":[155],"semantics":[156,166],"as":[157,258],"number":[159],"layers":[161],"increases.":[162],"Additionally,":[163],"mastering":[164],"proves":[167],"be":[169,248],"more":[170,260,281],"challenging,":[171],"information":[174],"usually":[175],"learned":[176],"final":[179],"layers;":[180],"(2)":[181],"Causal":[182],"decoder":[183],"architecture":[184],"left-to-right":[186],"masking":[188],"does":[189],"not":[190,247],"perform":[191],"well":[192],"zero-shot":[194],"tasks;":[195,254],"(3)":[196],"For":[197],"classification":[198],"tasks,":[199],"mean":[201],"vector":[202],"generated":[204],"by":[205],"over":[207],"sequence":[209],"tends":[210],"outperform":[212],"last":[214],"token":[215],"sequence;":[219],"(4)":[220],"Incorporating":[221],"parameter-efficient":[222],"fine-tuning":[223],"techniques":[224],"into":[225],"downstream":[228,267],"can":[230],"help":[231],"achieve":[233],"better":[234,275],"than":[236],"generation":[243],"but":[245],"may":[246],"optimal":[249],"some":[251],"understanding":[253],"(5)":[255],"LoRA":[256],"emerges":[257],"effective":[261],"PEFT":[262],"technique":[263],"code-related":[268],"We":[270],"hope":[271],"these":[272],"findings":[273],"will":[274],"guide":[276],"future":[277],"researchers":[278],"designing":[280],"powerful":[282]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
