{"id":"https://openalex.org/W4392739326","doi":"https://doi.org/10.1109/tse.2024.3376964","title":"Active Code Learning: Benchmarking Sample-Efficient Training of Code Models","display_name":"Active Code Learning: Benchmarking Sample-Efficient Training of Code Models","publication_year":2024,"publication_date":"2024-03-13","ids":{"openalex":"https://openalex.org/W4392739326","doi":"https://doi.org/10.1109/tse.2024.3376964"},"language":"en","primary_location":{"id":"doi:10.1109/tse.2024.3376964","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tse.2024.3376964","pdf_url":"https://ieeexplore.ieee.org/ielx7/32/4359463/10471610.pdf","source":{"id":"https://openalex.org/S8351582","display_name":"IEEE Transactions on Software Engineering","issn_l":"0098-5589","issn":["0098-5589","1939-3520","2326-3881"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Software Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/32/4359463/10471610.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101406450","display_name":"Qiang Hu","orcid":"https://orcid.org/0000-0002-8251-1669"},"institutions":[{"id":"https://openalex.org/I186903577","display_name":"University of Luxembourg","ror":"https://ror.org/036x5ad56","country_code":"LU","type":"education","lineage":["https://openalex.org/I186903577"]}],"countries":["LU"],"is_corresponding":true,"raw_author_name":"Qiang Hu","raw_affiliation_strings":["University of Luxembourg, Belval, Luxembourg"],"affiliations":[{"raw_affiliation_string":"University of Luxembourg, Belval, Luxembourg","institution_ids":["https://openalex.org/I186903577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023978917","display_name":"Yuejun Guo","orcid":"https://orcid.org/0000-0002-5535-2420"},"institutions":[{"id":"https://openalex.org/I4210112527","display_name":"Luxembourg Institute of Science and Technology","ror":"https://ror.org/01t178j62","country_code":"LU","type":"nonprofit","lineage":["https://openalex.org/I4210112527"]}],"countries":["LU"],"is_corresponding":false,"raw_author_name":"Yuejun Guo","raw_affiliation_strings":["Luxembourg Institute of Science and Technology, Belval, Luxembourg"],"affiliations":[{"raw_affiliation_string":"Luxembourg Institute of Science and Technology, Belval, Luxembourg","institution_ids":["https://openalex.org/I4210112527"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084396416","display_name":"Xiaofei Xie","orcid":"https://orcid.org/0000-0002-1288-6502"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xiaofei Xie","raw_affiliation_strings":["Singapore Management University, Singapore"],"affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000695937","display_name":"Maxime Cordy","orcid":"https://orcid.org/0000-0001-8312-1358"},"institutions":[{"id":"https://openalex.org/I186903577","display_name":"University of Luxembourg","ror":"https://ror.org/036x5ad56","country_code":"LU","type":"education","lineage":["https://openalex.org/I186903577"]}],"countries":["LU"],"is_corresponding":false,"raw_author_name":"Maxime Cordy","raw_affiliation_strings":["University of Luxembourg, Belval, Luxembourg"],"affiliations":[{"raw_affiliation_string":"University of Luxembourg, Belval, Luxembourg","institution_ids":["https://openalex.org/I186903577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101468661","display_name":"Lei Ma","orcid":"https://orcid.org/0000-0002-8621-2420"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["CA","JP"],"is_corresponding":false,"raw_author_name":"Lei Ma","raw_affiliation_strings":["University of Tokyo, Tokyo, Japan","University of Tokyo and University of Alberta"],"affiliations":[{"raw_affiliation_string":"University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"University of Tokyo and University of Alberta","institution_ids":["https://openalex.org/I154425047","https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081145634","display_name":"Mike Papadakis","orcid":"https://orcid.org/0000-0003-1852-2547"},"institutions":[{"id":"https://openalex.org/I186903577","display_name":"University of Luxembourg","ror":"https://ror.org/036x5ad56","country_code":"LU","type":"education","lineage":["https://openalex.org/I186903577"]}],"countries":["LU"],"is_corresponding":false,"raw_author_name":"Mike Papadakis","raw_affiliation_strings":["University of Luxembourg, Belval, Luxembourg"],"affiliations":[{"raw_affiliation_string":"University of Luxembourg, Belval, Luxembourg","institution_ids":["https://openalex.org/I186903577"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040574362","display_name":"Yves Le Traon","orcid":"https://orcid.org/0000-0002-1045-4861"},"institutions":[{"id":"https://openalex.org/I186903577","display_name":"University of Luxembourg","ror":"https://ror.org/036x5ad56","country_code":"LU","type":"education","lineage":["https://openalex.org/I186903577"]}],"countries":["LU"],"is_corresponding":false,"raw_author_name":"Yves Le Traon","raw_affiliation_strings":["University of Luxembourg, Belval, Luxembourg"],"affiliations":[{"raw_affiliation_string":"University of Luxembourg, Belval, Luxembourg","institution_ids":["https://openalex.org/I186903577"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101406450"],"corresponding_institution_ids":["https://openalex.org/I186903577"],"apc_list":null,"apc_paid":null,"fwci":6.1075,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.96136936,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"50","issue":"5","first_page":"1080","last_page":"1095"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8452873229980469},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7830907106399536},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.61600661277771},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.570783257484436},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4558502435684204},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.45578426122665405},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.4284965991973877},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34570086002349854},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32424628734588623}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8452873229980469},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7830907106399536},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.61600661277771},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.570783257484436},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4558502435684204},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.45578426122665405},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.4284965991973877},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34570086002349854},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32424628734588623},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tse.2024.3376964","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tse.2024.3376964","pdf_url":"https://ieeexplore.ieee.org/ielx7/32/4359463/10471610.pdf","source":{"id":"https://openalex.org/S8351582","display_name":"IEEE Transactions on Software Engineering","issn_l":"0098-5589","issn":["0098-5589","1939-3520","2326-3881"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Software Engineering","raw_type":"journal-article"},{"id":"pmh:oai:orbilu.uni.lu:10993/63488","is_oa":true,"landing_page_url":"https://orbilu.uni.lu/handle/10993/63488","pdf_url":"https://orbilu.uni.lu/bitstream/10993/63488/1/Active_Code_Learning_Benchmarking_Sample-Efficient_Training_of_Code_Models.pdf","source":{"id":"https://openalex.org/S4306401815","display_name":"Open Repository and Bibliography (University of Luxembourg)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I186903577","host_organization_name":"University of Luxembourg","host_organization_lineage":["https://openalex.org/I186903577"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Transactions on Software Engineering, 50 (5), 1080 - 1095 (2024-05)","raw_type":"peer reviewed"}],"best_oa_location":{"id":"doi:10.1109/tse.2024.3376964","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tse.2024.3376964","pdf_url":"https://ieeexplore.ieee.org/ielx7/32/4359463/10471610.pdf","source":{"id":"https://openalex.org/S8351582","display_name":"IEEE Transactions on Software Engineering","issn_l":"0098-5589","issn":["0098-5589","1939-3520","2326-3881"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Software Engineering","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5242316204","display_name":null,"funder_award_id":"101070303","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G5306067749","display_name":"Materials & Manufacturing of the FUTURE","funder_award_id":"266976","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7445321341","display_name":null,"funder_award_id":"C18/IS/12669767/STELLAR/LeTraon","funder_id":"https://openalex.org/F4320321038","funder_display_name":"Fonds National de la Recherche Luxembourg"},{"id":"https://openalex.org/G8051717526","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320321038","display_name":"Fonds National de la Recherche Luxembourg","ror":"https://ror.org/039z13y21"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392739326.pdf","grobid_xml":"https://content.openalex.org/works/W4392739326.grobid-xml"},"referenced_works_count":69,"referenced_works":["https://openalex.org/W1575078351","https://openalex.org/W2011674654","https://openalex.org/W2050855115","https://openalex.org/W2065053490","https://openalex.org/W2102831150","https://openalex.org/W2171671120","https://openalex.org/W2261775381","https://openalex.org/W2408920689","https://openalex.org/W2755846764","https://openalex.org/W2767717989","https://openalex.org/W2785836523","https://openalex.org/W2807964941","https://openalex.org/W2888557792","https://openalex.org/W2895344848","https://openalex.org/W2896457183","https://openalex.org/W2903158431","https://openalex.org/W2962755824","https://openalex.org/W2963935794","https://openalex.org/W2965373594","https://openalex.org/W3042703469","https://openalex.org/W3093464584","https://openalex.org/W3102727295","https://openalex.org/W3119507053","https://openalex.org/W3126675481","https://openalex.org/W3205471381","https://openalex.org/W4220722393","https://openalex.org/W4224214784","https://openalex.org/W4225410698","https://openalex.org/W4249314064","https://openalex.org/W4288089799","https://openalex.org/W4306780108","https://openalex.org/W4310884551","https://openalex.org/W4313563421","https://openalex.org/W4362598291","https://openalex.org/W4367000100","https://openalex.org/W4367189393","https://openalex.org/W4377864824","https://openalex.org/W4378473878","https://openalex.org/W4378591002","https://openalex.org/W4384009718","https://openalex.org/W4384345639","https://openalex.org/W4384345640","https://openalex.org/W4384345698","https://openalex.org/W4384345728","https://openalex.org/W4388483038","https://openalex.org/W4389524484","https://openalex.org/W6735374517","https://openalex.org/W6747231328","https://openalex.org/W6754277761","https://openalex.org/W6756615331","https://openalex.org/W6763607942","https://openalex.org/W6766673545","https://openalex.org/W6767260250","https://openalex.org/W6769243733","https://openalex.org/W6769627184","https://openalex.org/W6773936880","https://openalex.org/W6783227185","https://openalex.org/W6790588633","https://openalex.org/W6800949977","https://openalex.org/W6800994414","https://openalex.org/W6839598838","https://openalex.org/W6846732047","https://openalex.org/W6847206046","https://openalex.org/W6851228291","https://openalex.org/W6852131103","https://openalex.org/W6852318870","https://openalex.org/W6852529130","https://openalex.org/W6852775702","https://openalex.org/W6864870587"],"related_works":["https://openalex.org/W4238897586","https://openalex.org/W435179959","https://openalex.org/W2619091065","https://openalex.org/W2059640416","https://openalex.org/W1490753184","https://openalex.org/W2284465472","https://openalex.org/W2291782699","https://openalex.org/W1993948687","https://openalex.org/W2000169967","https://openalex.org/W2112883198"],"abstract_inverted_index":{"The":[0,163],"costly":[1],"human":[2,39],"effort":[3,40],"required":[4],"to":[5,52,59,113,152,177,203,222],"prepare":[6],"the":[7,93,110,181,185,204,240],"training":[8,33],"data":[9,65,132,179],"of":[10,35,95,212,242],"machine":[11],"learning":[12,47,97,172,191,215],"(ML)":[13],"models":[14,34,68,196],"hinders":[15],"their":[16],"practical":[17],"development":[18],"and":[19,80,140,173,230,239],"usage":[20],"in":[21,77,134],"software":[22],"engineering":[23],"(ML4Code),":[24],"especially":[25],"for":[26,98,131,143,160],"those":[27],"with":[28,37,63,69,197,216,227],"limited":[29],"budgets.":[30],"Therefore,":[31],"efficiently":[32],"code":[36,99,120,161,186,190,214,243],"less":[38],"has":[41,73],"become":[42],"an":[43,149,217],"emergent":[44],"problem.":[45],"Active":[46],"is":[48,87,180,192],"such":[49,89],"a":[50,61,199,232],"technique":[51],"address":[53],"this":[54,102,106,115],"issue":[55],"that":[56,91,166],"allows":[57],"developers":[58],"train":[60],"model":[62],"reduced":[64],"while":[66],"producing":[67],"desired":[70],"performance,":[71],"which":[72,194],"been":[74],"well":[75],"studied":[76],"computer":[78],"vision":[79],"natural":[81],"language":[82],"processing":[83],"domains.":[84],"Unfortunately,":[85],"there":[86],"no":[88],"work":[90],"explores":[92],"effectiveness":[94],"active":[96,119,135,171,189,213],"models.":[100,244],"In":[101],"paper,":[103],"we":[104,123,147,208],"bridge":[105],"gap":[107,201],"by":[108],"building":[109],"first":[111],"benchmark":[112],"study":[114,151],"critical":[116],"problem":[117],"-":[118],"learning.":[121],"Specifically,":[122],"collect":[124],"11":[125],"acquisition":[126,156],"functions":[127,157],"(which":[128],"are":[129],"used":[130],"selection":[133,168],"learning)":[136],"from":[137],"existing":[138],"works":[139],"adapt":[141],"them":[142],"code-related":[144],"tasks.":[145],"Then,":[146],"conduct":[148],"empirical":[150],"check":[153],"whether":[154],"these":[155,235],"maintain":[158],"performance":[159,241],"data.":[162],"results":[164],"demonstrate":[165],"feature":[167],"highly":[169],"affects":[170],"using":[174],"output":[175],"vectors":[176],"select":[178],"best":[182],"choice.":[183],"For":[184],"summarization":[187],"task,":[188],"ineffective":[193],"produces":[195],"over":[198],"29.64%":[200],"compared":[202],"expected":[205],"performance.":[206],"Furthermore,":[207],"explore":[209],"future":[210],"directions":[211],"exploratory":[218],"study.":[219],"We":[220],"propose":[221],"replace":[223],"distance":[224,237],"calculation":[225],"methods":[226,238],"evaluation":[228],"metrics":[229],"find":[231],"correlation":[233],"between":[234],"evaluation-based":[236]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
