{"id":"https://openalex.org/W4411450081","doi":"https://doi.org/10.1145/3715727","title":"COFFE: A Code Efficiency Benchmark for Code Generation","display_name":"COFFE: A Code Efficiency Benchmark for Code Generation","publication_year":2025,"publication_date":"2025-06-19","ids":{"openalex":"https://openalex.org/W4411450081","doi":"https://doi.org/10.1145/3715727"},"language":"en","primary_location":{"id":"doi:10.1145/3715727","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3715727","pdf_url":null,"source":{"id":"https://openalex.org/S4404663975","display_name":"Proceedings of the ACM on software engineering.","issn_l":"2994-970X","issn":["2994-970X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Software Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1145/3715727","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101845156","display_name":"Yun Peng","orcid":"https://orcid.org/0000-0003-1936-5598"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Yun Peng","raw_affiliation_strings":["The Chinese University of Hong Kong, HongKong, China"],"raw_orcid":"https://orcid.org/0000-0003-1936-5598","affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, HongKong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jun Wan","orcid":"https://orcid.org/0009-0006-3294-688X"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Wan","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0006-3294-688X","affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100426730","display_name":"Yichen Li","orcid":"https://orcid.org/0009-0009-8370-644X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yichen Li","raw_affiliation_strings":["The Chinese University of Hong Kong, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0009-8370-644X","affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, Hangzhou, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043600295","display_name":"Xiaoxue Ren","orcid":"https://orcid.org/0000-0002-5526-1617"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoxue Ren","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-5526-1617","affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101845156"],"corresponding_institution_ids":["https://openalex.org/I177725633"],"apc_list":null,"apc_paid":null,"fwci":14.881,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.98884608,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"2","issue":"FSE","first_page":"242","last_page":"265"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.7873370051383972},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6946272850036621},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6849777102470398},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.6195152997970581},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.618541955947876},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.445615291595459},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.4364953637123108},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.43545156717300415},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.20549792051315308},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.19679683446884155},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15492835640907288},{"id":"https://openalex.org/keywords/operations-management","display_name":"Operations management","score":0.11671417951583862},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.07006266713142395}],"concepts":[{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.7873370051383972},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6946272850036621},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6849777102470398},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.6195152997970581},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.618541955947876},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.445615291595459},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.4364953637123108},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.43545156717300415},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.20549792051315308},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.19679683446884155},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15492835640907288},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.11671417951583862},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.07006266713142395},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3715727","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3715727","pdf_url":null,"source":{"id":"https://openalex.org/S4404663975","display_name":"Proceedings of the ACM on software engineering.","issn_l":"2994-970X","issn":["2994-970X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Software Engineering","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3715727","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3715727","pdf_url":null,"source":{"id":"https://openalex.org/S4404663975","display_name":"Proceedings of the ACM on software engineering.","issn_l":"2994-970X","issn":["2994-970X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Software Engineering","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.550000011920929,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W2145705994","https://openalex.org/W2316269269","https://openalex.org/W2747329762","https://openalex.org/W2930957955","https://openalex.org/W3108371183","https://openalex.org/W3198685994","https://openalex.org/W4206251287","https://openalex.org/W4307079201","https://openalex.org/W4307789634","https://openalex.org/W4311887664","https://openalex.org/W4315706637","https://openalex.org/W4323570365","https://openalex.org/W4327810158","https://openalex.org/W4361866100","https://openalex.org/W4365205411","https://openalex.org/W4368755703","https://openalex.org/W4376167329","https://openalex.org/W4378591002","https://openalex.org/W4379548473","https://openalex.org/W4380993527","https://openalex.org/W4386185625","https://openalex.org/W4387356199","https://openalex.org/W4387561453","https://openalex.org/W4389104713","https://openalex.org/W4389364446","https://openalex.org/W4389422760","https://openalex.org/W4389519225","https://openalex.org/W4389519352","https://openalex.org/W4389983379","https://openalex.org/W4390092490","https://openalex.org/W4390723197","https://openalex.org/W4390963096","https://openalex.org/W4391272793","https://openalex.org/W4391555701","https://openalex.org/W4391590673","https://openalex.org/W4391988244","https://openalex.org/W4394654277","https://openalex.org/W4394906122","https://openalex.org/W4395064918","https://openalex.org/W4395474395","https://openalex.org/W4396813586","https://openalex.org/W4396815229","https://openalex.org/W4399114781","https://openalex.org/W4399511783","https://openalex.org/W4399598203","https://openalex.org/W4399836661","https://openalex.org/W4399912173","https://openalex.org/W4400484392","https://openalex.org/W6967084484"],"related_works":["https://openalex.org/W3008339103","https://openalex.org/W1667647204","https://openalex.org/W2404647514","https://openalex.org/W4247536566","https://openalex.org/W1482441085","https://openalex.org/W2966858528","https://openalex.org/W2151687600","https://openalex.org/W2048831961","https://openalex.org/W1606349578","https://openalex.org/W4399567378"],"abstract_inverted_index":{"Code":[0],"generation":[1,133,168],"has":[2],"largely":[3],"improved":[4],"development":[5],"efficiency":[6,66,81,92,114,123,139],"in":[7,33,120,241],"the":[8,16,44,56,60,64,90,98,109,112,118,121,137,159,181,186,221],"era":[9],"of":[10,46,67,93,111,125,140,176,183,239],"large":[11],"language":[12],"models":[13],"(LLMs).":[14],"With":[15],"ability":[17],"to":[18,26,42,54,179,198,233],"follow":[19],"instructions,":[20],"current":[21,99],"LLMs":[22,212,240],"can":[23],"be":[24],"prompted":[25],"generate":[27],"code":[28,69,95,126,132,142,154,242],"solutions":[29,70],"given":[30],"detailed":[31],"descriptions":[32],"natural":[34],"language.":[35],"Many":[36],"research":[37,236],"efforts":[38],"are":[39,52,76],"being":[40],"devoted":[41],"improving":[43],"correctness":[45,57,74],"LLM-generated":[47,68,141],"code,":[48],"and":[49,106,147,152,172,202,215,230,237],"many":[50],"benchmarks":[51,75],"proposed":[53],"evaluate":[55,209],"comprehensively.":[58],"Despite":[59],"focus":[61],"on":[62,194,213,220],"correctness,":[63],"time":[65,80,91,101,113,122,138,187],"is":[71,103],"under-explored.":[72],"Current":[73],"not":[77,104],"suitable":[78],"for":[79,135,150,227],"evaluation":[82,124,188],"since":[83],"their":[84],"test":[85,166,177],"cases":[86,178],"cannot":[87],"well":[88],"distinguish":[89],"different":[94,206],"solutions.":[96,143,207],"Besides,":[97],"execution":[100],"measurement":[102],"stable":[105,201],"comprehensive,":[107],"threatening":[108],"validity":[110],"evaluation.":[115],"To":[116,157],"address":[117],"challenges":[119],"generation,":[127,155],"we":[128,161,190,223],"propose":[129,191],"COFFE,":[130],"a":[131,163,200],"benchmark":[134],"evaluating":[136],"COFFE":[144,214],"contains":[145],"398":[146],"358":[148],"problems":[149],"function-level":[151],"file-level":[153],"respectively.":[156],"improve":[158,180],"distinguishability,":[160],"design":[162],"novel":[164],"stressful":[165],"case":[167],"approach":[169],"with":[170],"contracts":[171],"two":[173],"new":[174],"formats":[175],"accuracy":[182],"generation.":[184,243],"For":[185],"metric,":[189],"efficienct@k":[192],"based":[193],"CPU":[195],"instruction":[196],"count":[197],"ensure":[199],"solid":[203],"comparison":[204],"between":[205],"We":[208],"14":[210],"popular":[211],"identify":[216],"four":[217],"findings.":[218],"Based":[219],"findings,":[222],"draw":[224],"some":[225],"implications":[226],"LLM":[228],"researchers":[229],"software":[231],"practitioners":[232],"facilitate":[234],"future":[235],"usage":[238]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
