{"id":"https://openalex.org/W3178061567","doi":"https://doi.org/10.1145/3460319.3464819","title":"Deep just-in-time defect prediction: how far are we?","display_name":"Deep just-in-time defect prediction: how far are we?","publication_year":2021,"publication_date":"2021-07-08","ids":{"openalex":"https://openalex.org/W3178061567","doi":"https://doi.org/10.1145/3460319.3464819","mag":"3178061567"},"language":"en","primary_location":{"id":"doi:10.1145/3460319.3464819","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3460319.3464819","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM SIGSOFT International Symposium on Software Testing and Analysis","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010506833","display_name":"Zhengran Zeng","orcid":"https://orcid.org/0009-0009-8422-4522"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengran Zeng","raw_affiliation_strings":["Southern University of Science and Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030322956","display_name":"Yuqun Zhang","orcid":"https://orcid.org/0000-0002-1499-5729"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuqun Zhang","raw_affiliation_strings":["Southern University of Science and Technology, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology, China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100392967","display_name":"Haotian Zhang","orcid":"https://orcid.org/0000-0003-0478-3869"},"institutions":[{"id":"https://openalex.org/I2801745840","display_name":"Kwai Chung Hospital","ror":"https://ror.org/05kz7bw59","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I1294586568","https://openalex.org/I2801745840"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haotian Zhang","raw_affiliation_strings":["Kwai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kwai, China","institution_ids":["https://openalex.org/I2801745840"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043546718","display_name":"Lingming Zhang","orcid":"https://orcid.org/0000-0001-5175-2702"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lingming Zhang","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, USA"],"raw_orcid":"https://orcid.org/0000-0001-5175-2702","affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, USA","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":18.7768,"has_fulltext":false,"cited_by_count":97,"citation_normalized_percentile":{"value":0.99312511,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"427","last_page":"438"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/commit","display_name":"Commit","score":0.8291874527931213},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8078011274337769},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5932275056838989},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5611521005630493},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5563454627990723},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5217450857162476},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.4885309934616089},{"id":"https://openalex.org/keywords/feature-engineering","display_name":"Feature engineering","score":0.45628342032432556},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45145735144615173},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.44817060232162476},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4147995412349701},{"id":"https://openalex.org/keywords/source-lines-of-code","display_name":"Source lines of code","score":0.41141706705093384},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.33541420102119446},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.32496780157089233},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.23508936166763306},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.12178391218185425},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.10111552476882935},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09773379564285278}],"concepts":[{"id":"https://openalex.org/C153180980","wikidata":"https://www.wikidata.org/wiki/Q19776675","display_name":"Commit","level":2,"score":0.8291874527931213},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8078011274337769},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5932275056838989},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5611521005630493},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5563454627990723},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5217450857162476},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.4885309934616089},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.45628342032432556},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45145735144615173},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.44817060232162476},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4147995412349701},{"id":"https://openalex.org/C199519371","wikidata":"https://www.wikidata.org/wiki/Q942695","display_name":"Source lines of code","level":3,"score":0.41141706705093384},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33541420102119446},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.32496780157089233},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.23508936166763306},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.12178391218185425},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.10111552476882935},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09773379564285278},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3460319.3464819","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3460319.3464819","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM SIGSOFT International Symposium on Software Testing and Analysis","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3814908347","display_name":null,"funder_award_id":"KQTD2016112514355531","funder_id":"https://openalex.org/F4320335790","funder_display_name":"Shenzhen Peacock Plan"},{"id":"https://openalex.org/G5511685887","display_name":null,"funder_award_id":"61902169","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335790","display_name":"Shenzhen Peacock Plan","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W132347231","https://openalex.org/W1655956671","https://openalex.org/W1680392829","https://openalex.org/W2007705030","https://openalex.org/W2065547122","https://openalex.org/W2073649165","https://openalex.org/W2100945416","https://openalex.org/W2104329051","https://openalex.org/W2105300539","https://openalex.org/W2105776892","https://openalex.org/W2110229593","https://openalex.org/W2120703352","https://openalex.org/W2126166995","https://openalex.org/W2132887549","https://openalex.org/W2147105902","https://openalex.org/W2147386665","https://openalex.org/W2158744032","https://openalex.org/W2163732854","https://openalex.org/W2276400542","https://openalex.org/W2344367508","https://openalex.org/W2470673105","https://openalex.org/W2599212561","https://openalex.org/W2606150376","https://openalex.org/W2743316948","https://openalex.org/W2744611928","https://openalex.org/W2774919641","https://openalex.org/W2787407015","https://openalex.org/W2792987835","https://openalex.org/W2887758210","https://openalex.org/W2898124301","https://openalex.org/W2898435572","https://openalex.org/W2919115771","https://openalex.org/W2955232136","https://openalex.org/W2955991060","https://openalex.org/W2962858109","https://openalex.org/W2963548617","https://openalex.org/W2964279097","https://openalex.org/W2966592377","https://openalex.org/W3009761259","https://openalex.org/W3011013751","https://openalex.org/W3033234605","https://openalex.org/W3089692094","https://openalex.org/W3093046707","https://openalex.org/W3105867435","https://openalex.org/W3106142244","https://openalex.org/W3122184684","https://openalex.org/W4302798214"],"related_works":["https://openalex.org/W2033235985","https://openalex.org/W2763289028","https://openalex.org/W2031796104","https://openalex.org/W4213113901","https://openalex.org/W1498479218","https://openalex.org/W2923727989","https://openalex.org/W1792679987","https://openalex.org/W4361792201","https://openalex.org/W3023254737","https://openalex.org/W2953504043"],"abstract_inverted_index":{"Defect":[0],"prediction":[1,24,45,178,210,232,279],"aims":[2],"to":[3,54,87,104,131],"automatically":[4],"identify":[5],"potential":[6],"defective":[7],"code":[8,61,79],"with":[9,69,126,152,240],"minimal":[10],"human":[11],"intervention":[12],"and":[13,33,63,65,77,123,136,173,190,212,253,258],"has":[14,34,101],"been":[15,35,102],"widely":[16,36],"studied":[17],"in":[18,38,255,265,280],"the":[19,83,106,109,134,160,204,215,237,241,268,281],"literature.":[20],"Just-in-Time":[21],"(JIT)":[22],"defect":[23,44,113,177,199,209,231,256,278],"focuses":[25],"on":[26,119,148],"program":[27],"changes":[28,80,155],"rather":[29],"than":[30,159],"whole":[31],"programs,":[32],"adopted":[37],"continuous":[39],"testing.":[40],"CC2Vec,":[41,139],"state-of-the-art":[42],"JIT":[43,112,176,198,230,277],"tool,":[46],"first":[47],"constructs":[48],"a":[49,89,94,120,149,228,247],"hierarchical":[50],"attention":[51],"network":[52],"(HAN)":[53],"learn":[55],"distributed":[56],"vector":[57],"representations":[58],"of":[59,108,138,146,192,206],"both":[60],"additions":[62],"deletions,":[64],"then":[66],"concatenates":[67],"them":[68,193],"two":[70],"other":[71,219],"embedding":[72],"vectors":[73],"representing":[74],"commit":[75,96],"messages":[76],"overall":[78],"extracted":[81],"by":[82,223],"existing":[84],"DeepJIT":[85,172,254],"approach":[86,233,249],"train":[88],"model":[90],"for":[91,111,275],"predicting":[92],"whether":[93],"given":[95],"is":[97],"defective.":[98],"Although":[99],"CC2Vec":[100,147,162,170,185,252],"shown":[103],"be":[105,260],"state":[107],"art":[110],"prediction,":[114,257],"it":[115],"was":[116],"only":[117],"evaluated":[118],"limited":[121],"dataset":[122,151],"not":[124],"compared":[125],"all":[127],"representative":[128,174],"baselines.":[129],"Therefore,":[130],"further":[132],"investigate":[133,203],"efficacy":[135],"limitations":[137],"this":[140,224],"paper":[141,269],"performs":[142],"an":[143],"extensive":[144],"study":[145],"large-scale":[150],"over":[153],"310,370":[154],"(8.3":[156],"X":[157,263],"larger":[158],"original":[161],"dataset).":[163],"More":[164],"specifically,":[165],"we":[166,226],"also":[167,202,270],"empirically":[168],"compare":[169],"against":[171],"traditional":[175,197,208,220],"techniques.":[179],"The":[180],"experimental":[181],"results":[182],"show":[183],"that":[184,214],"cannot":[186],"consistently":[187,195],"outperform":[188,196,251],"DeepJIT,":[189],"neither":[191],"can":[194,250,259],"prediction.":[200],"We":[201],"impact":[205],"individual":[207],"features":[211],"find":[213],"added-line-number":[216,238],"feature":[217,239],"outperforms":[218],"features.":[221],"Inspired":[222],"finding,":[225],"construct":[227],"simplistic":[229,248],"which":[234],"simply":[235],"adopts":[236],"logistic":[242],"regression":[243],"classifier.":[244],"Surprisingly,":[245],"such":[246],"81k":[261],"X/120k":[262],"faster":[264],"training/testing.":[266],"Furthermore,":[267],"provides":[271],"various":[272],"practical":[273],"guidelines":[274],"advancing":[276],"near":[282],"future.":[283]},"counts_by_year":[{"year":2026,"cited_by_count":10},{"year":2025,"cited_by_count":21},{"year":2024,"cited_by_count":25},{"year":2023,"cited_by_count":24},{"year":2022,"cited_by_count":17}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
