{"id":"https://openalex.org/W7161134843","doi":"https://doi.org/10.48550/arxiv.2605.12857","title":"ChipMATE: Multi-Agent Training via Reinforcement Learning for Enhanced RTL Generation","display_name":"ChipMATE: Multi-Agent Training via Reinforcement Learning for Enhanced RTL Generation","publication_year":2026,"publication_date":"2026-05-13","ids":{"openalex":"https://openalex.org/W7161134843","doi":"https://doi.org/10.48550/arxiv.2605.12857"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.12857","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12857","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.12857","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136129808","display_name":"Zhongkai Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Zhongkai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121811662","display_name":"Yichen Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Yichen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136172269","display_name":"Chenyang Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Chenyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136171584","display_name":"Yuwei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yuwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136137819","display_name":"Kun Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Kun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027637051","display_name":"Cui Junxia","orcid":"https://orcid.org/0009-0006-7097-3854"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Junxia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136146098","display_name":"Haotian Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Haotian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136108010","display_name":"Zhengding Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Zhengding","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136158786","display_name":"Zaifeng Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Zaifeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136165968","display_name":"Ruiyi Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ruiyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136152340","display_name":"Yujie Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Yujie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136127796","display_name":"Hejia Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Hejia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136091190","display_name":"Jingbo Shang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shang, Jingbo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136142797","display_name":"Jishen Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Jishen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136153321","display_name":"Yufei Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Yufei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":15,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.28220000863075256,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.28220000863075256,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.05249999836087227,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.05209999904036522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.6715999841690063},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.46700000762939453},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.44850000739097595},{"id":"https://openalex.org/keywords/train","display_name":"Train","score":0.43700000643730164},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.4009999930858612},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.3589000105857849},{"id":"https://openalex.org/keywords/verilog","display_name":"Verilog","score":0.3450999855995178},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.33880001306533813},{"id":"https://openalex.org/keywords/satisfiability-modulo-theories","display_name":"Satisfiability modulo theories","score":0.3312000036239624}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7756999731063843},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.6715999841690063},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.46700000762939453},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.44850000739097595},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.43700000643730164},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.415800005197525},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.4133000075817108},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.4009999930858612},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.3589000105857849},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.34860000014305115},{"id":"https://openalex.org/C2779030575","wikidata":"https://www.wikidata.org/wiki/Q827773","display_name":"Verilog","level":3,"score":0.3450999855995178},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.33880001306533813},{"id":"https://openalex.org/C164155591","wikidata":"https://www.wikidata.org/wiki/Q2067766","display_name":"Satisfiability modulo theories","level":2,"score":0.3312000036239624},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.3310000002384186},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.3246000111103058},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.32109999656677246},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3203999996185303},{"id":"https://openalex.org/C193702766","wikidata":"https://www.wikidata.org/wiki/Q1414548","display_name":"Concurrency","level":2,"score":0.3140999972820282},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.3061999976634979},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.3019999861717224},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.26499998569488525},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.2574000060558319},{"id":"https://openalex.org/C199519371","wikidata":"https://www.wikidata.org/wiki/Q942695","display_name":"Source lines of code","level":3,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.12857","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12857","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.12857","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.12857","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.5937871336936951,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Existing":[0],"API-based":[1],"agentic":[2],"systems":[3],"for":[4,83],"RTL":[5,42,84,98],"code":[6,206],"generation":[7,22],"are":[8,210],"fundamentally":[9],"misaligned":[10],"with":[11,29,108,187,202],"industrial":[12,69,88],"practice:":[13],"they":[14],"assume":[15],"a":[16,105,109,125,136,166],"golden":[17,121],"testbench":[18],"is":[19],"available":[20,212],"at":[21],"time,":[23],"rely":[24],"on":[25,39,184],"closed-source":[26],"APIs":[27],"incompatible":[28],"chip":[30],"vendors'":[31,40],"air-gapped":[32],"security":[33],"requirements,":[34],"and":[35,100,135,181,189,198,207],"cannot":[36],"be":[37],"trained":[38],"proprietary":[41],"codebases,":[43],"leaving":[44],"valuable":[45],"internal":[46],"data":[47],"unused.":[48],"Recent":[49],"self-trained":[50,80,196],"models":[51,197],"address":[52],"the":[53,62,78,153,161],"deployment":[54],"constraint":[55],"but":[56],"remain":[57],"single-turn":[58],"generators":[59],"that":[60,113,140,170],"overlook":[61],"critical":[63],"role":[64],"of":[65],"verification":[66],"in":[67,213],"real":[68],"flows.":[70],"To":[71,159],"bridge":[72],"these":[73],"gaps,":[74],"we":[75,163],"present":[76],"ChipMATE,":[77],"first":[79,141],"multi-agent":[81],"framework":[82,169],"generation.":[85],"Inspired":[86],"by":[87],"practice":[89],"where":[90],"correctness":[91],"emerges":[92],"from":[93],"cross-comparison":[94],"between":[95],"independently":[96],"written":[97],"modules":[99],"reference":[101,174],"models,":[102,192],"ChipMATE":[103,178],"pairs":[104],"Verilog":[106],"agent":[107,112,144],"Python":[110],"reference-model":[111],"mutually":[114],"verify":[115],"each":[116,143],"other's":[117],"outputs":[118],"without":[119],"any":[120],"oracle.":[122],"We":[123],"design":[124],"backtrack-based":[126],"inference":[127],"workflow":[128],"to":[129,146,156],"prevent":[130],"error":[131],"propagation":[132],"across":[133],"turns,":[134],"two-stage":[137],"training":[138,176],"pipeline":[139],"trains":[142,152],"individually":[145],"saturate":[147],"its":[148],"code-generation":[149],"capability,":[150],"then":[151],"team":[154],"jointly":[155],"collaborate":[157],"effectively.":[158],"support":[160],"training,":[162],"further":[164],"build":[165],"hybrid":[167],"data-generation":[168],"produces":[171],"64.4K":[172],"high-quality":[173],"model":[175,208],"samples.":[177],"achieves":[179],"75.0\\%":[180],"80.1\\%":[182],"pass@1":[183],"VerilogEval":[185],"V2":[186],"4B":[188],"9B":[190],"base":[191],"outperforming":[193],"all":[194],"existing":[195],"even":[199],"DeepSeek":[200],"V4":[201],"1600B":[203],"parameters.":[204],"Our":[205],"weights":[209],"publicly":[211],"https://github.com/zhongkaiyu/ChipMATE.":[214]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-15T00:00:00"}
