{"id":"https://openalex.org/W4415413157","doi":"https://doi.org/10.18293/seke2025-053","title":"Beyond Test Cases: Multi-Agent Collaboration for Detecting Errors in Full-Score Code Implementations","display_name":"Beyond Test Cases: Multi-Agent Collaboration for Detecting Errors in Full-Score Code Implementations","publication_year":2025,"publication_date":"2025-09-29","ids":{"openalex":"https://openalex.org/W4415413157","doi":"https://doi.org/10.18293/seke2025-053"},"language":null,"primary_location":{"id":"doi:10.18293/seke2025-053","is_oa":true,"landing_page_url":"https://doi.org/10.18293/seke2025-053","pdf_url":"https://doi.org/10.18293/seke2025-053","source":{"id":"https://openalex.org/S4220650826","display_name":"Proceedings/Proceedings of the ... International Conference on Software Engineering and Knowledge Engineering","issn_l":"2325-9000","issn":["2325-9000","2325-9086"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conferences on Software Engineering and Knowledge Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://doi.org/10.18293/seke2025-053","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107952085","display_name":"Yiwei Li","orcid":"https://orcid.org/0009-0009-3329-810X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yiwei Li","raw_affiliation_strings":["College of Computer Science and Technology National University of Defense Technology Changsha , China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology National University of Defense Technology Changsha , China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053312950","display_name":"Jiaxin Liu","orcid":"https://orcid.org/0000-0003-2449-1150"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaxin Liu","raw_affiliation_strings":["College of Computer Science and Technology National University of Defense Technology Changsha , China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology National University of Defense Technology Changsha , China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104097662","display_name":"Yanfeng Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanfeng Hu","raw_affiliation_strings":["College of Computer Science and Technology National University of Defense Technology Changsha , China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology National University of Defense Technology Changsha , China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079131572","display_name":"Chen Liu","orcid":"https://orcid.org/0000-0002-8803-9617"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Liu","raw_affiliation_strings":["College of Computer Science and Technology National University of Defense Technology Changsha , China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology National University of Defense Technology Changsha , China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083915061","display_name":"Yating Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yating Zhang","raw_affiliation_strings":["College of Computer Science and Technology National University of Defense Technology Changsha , China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology National University of Defense Technology Changsha , China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101846770","display_name":"Liangze Yin","orcid":"https://orcid.org/0000-0002-1645-2787"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liangze Yin","raw_affiliation_strings":["College of Computer Science and Technology National University of Defense Technology Changsha , China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology National University of Defense Technology Changsha , China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100654380","display_name":"Wei Dong","orcid":"https://orcid.org/0000-0002-8033-7943"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Dong","raw_affiliation_strings":["College of Computer Science and Technology National University of Defense Technology Changsha , China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology National University of Defense Technology Changsha , China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5107952085"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.43230977,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"2025","issue":null,"first_page":"124","last_page":"129"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5253000259399414},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.4747999906539917},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.44929999113082886},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.2711000144481659},{"id":"https://openalex.org/keywords/error-detection-and-correction","display_name":"Error detection and correction","score":0.26249998807907104},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.258899986743927}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.656000018119812},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5253000259399414},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.4747999906539917},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.44929999113082886},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3732999861240387},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C103088060","wikidata":"https://www.wikidata.org/wiki/Q1062839","display_name":"Error detection and correction","level":2,"score":0.26249998807907104},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.2574000060558319},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2567000091075897},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.25279998779296875},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18293/seke2025-053","is_oa":true,"landing_page_url":"https://doi.org/10.18293/seke2025-053","pdf_url":"https://doi.org/10.18293/seke2025-053","source":{"id":"https://openalex.org/S4220650826","display_name":"Proceedings/Proceedings of the ... International Conference on Software Engineering and Knowledge Engineering","issn_l":"2325-9000","issn":["2325-9000","2325-9086"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conferences on Software Engineering and Knowledge Engineering","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18293/seke2025-053","is_oa":true,"landing_page_url":"https://doi.org/10.18293/seke2025-053","pdf_url":"https://doi.org/10.18293/seke2025-053","source":{"id":"https://openalex.org/S4220650826","display_name":"Proceedings/Proceedings of the ... International Conference on Software Engineering and Knowledge Engineering","issn_l":"2325-9000","issn":["2325-9000","2325-9086"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conferences on Software Engineering and Knowledge Engineering","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G41279851","display_name":null,"funder_award_id":"62032024","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6058138561","display_name":null,"funder_award_id":", No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7360548921","display_name":null,"funder_award_id":"U2341212","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4415413157.pdf","grobid_xml":"https://content.openalex.org/works/W4415413157.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Automated":[0],"evaluation":[1,124,176],"of":[2,48,116,125],"programming":[3,97],"code":[4,45,69,92],"on":[5,10,89],"online":[6,104],"platforms":[7],"often":[8],"relies":[9],"predefined":[11],"test":[12,17],"cases.However,":[13],"due":[14],"to":[15,41],"limited":[16],"coverage,":[18],"many":[19],"programs":[20],"receive":[21],"full":[22],"marks":[23],"despite":[24],"violating":[25],"intended":[26],"specifications.We":[27],"present":[28],"Maveric,":[29],"a":[30,51,61,68,79,101],"framework":[31],"that":[32,54,64,71,82],"combines":[33],"large":[34],"language":[35],"models":[36],"(LLMs)":[37],"with":[38,110,118],"formal":[39,56,144],"verification":[40,145],"more":[42],"rigorously":[43],"assess":[44],"correctness.Maveric":[46],"consists":[47],"four":[49],"agents:":[50],"template":[52],"generator":[53],"derives":[55],"specifications":[57],"from":[58,94,100],"problem":[59],"descriptions,":[60],"consistency":[62],"checker":[63],"validates":[65],"semantic":[66,165],"alignment,":[67],"analyzer":[70],"detects":[72],"potential":[73],"defects":[74,137,154],"and":[75,78,149,171],"synthesizes":[76],"counterexamples,":[77,162],"counterexample":[80],"validator":[81],"formally":[83],"verifies":[84],"their":[85,164],"validity.We":[86],"evaluated":[87],"Maveric":[88,157],"100":[90],"full-score":[91],"submissions":[93],"10":[95],"real-world":[96],"tasks":[98],"sourced":[99],"widely":[102],"used":[103],"education":[105],"platform.Manual":[106],"review":[107],"identified":[108],"32":[109],"functional":[111],"defects.Maveric":[112],"accurately":[113],"detected":[114,135],"31":[115],"these":[117],"no":[119],"false":[120,141],"positives,":[121,142],"completing":[122],"the":[123],"each":[126],"program":[127,175],"in":[128,177],"under":[129],"one":[130],"minute.In":[131],"contrast,":[132],"LLM-only":[133],"methods":[134],"25":[136],"but":[138],"yielded":[139],"6":[140],"while":[143],"alone":[146],"found":[147],"23":[148],"suffered":[150],"frequent":[151],"timeouts.Importantly,":[152],"all":[153],"reported":[155],"by":[156,160],"were":[158],"supported":[159],"verifiable":[161],"confirming":[163],"violations.These":[166],"results":[167],"demonstrate":[168],"Maveric's":[169],"effectiveness":[170],"practicality":[172],"for":[173],"automated":[174],"educational":[178],"settings.":[179]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-24T00:00:00"}
