{"id":"https://openalex.org/W4409671919","doi":"https://doi.org/10.1145/3696410.3714889","title":"WebCode2M: A Real-World Dataset for Code Generation from Webpage Designs","display_name":"WebCode2M: A Real-World Dataset for Code Generation from Webpage Designs","publication_year":2025,"publication_date":"2025-04-22","ids":{"openalex":"https://openalex.org/W4409671919","doi":"https://doi.org/10.1145/3696410.3714889"},"language":"en","primary_location":{"id":"doi:10.1145/3696410.3714889","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3696410.3714889","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084159330","display_name":"Yi Gui","orcid":"https://orcid.org/0009-0006-2841-7942"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yi Gui","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhen Li","orcid":"https://orcid.org/0009-0007-0873-6126"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Li","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101555948","display_name":"Yao Wan","orcid":"https://orcid.org/0000-0001-6937-4180"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yao Wan","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081388259","display_name":"Yemin Shi","orcid":"https://orcid.org/0000-0001-9024-7266"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yemin Shi","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100412598","display_name":"Hongyu Zhang","orcid":"https://orcid.org/0000-0002-3063-9425"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongyu Zhang","raw_affiliation_strings":["Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111133708","display_name":"Bohua Chen","orcid":"https://orcid.org/0009-0004-8927-8902"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bohua Chen","raw_affiliation_strings":["Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109980408","display_name":"Yi Su","orcid":"https://orcid.org/0009-0007-9336-3562"},"institutions":[{"id":"https://openalex.org/I4210126203","display_name":"Hubei University of Automotive Technology","ror":"https://ror.org/039m95m06","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210126203"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Su","raw_affiliation_strings":["Hubei University of Automotive Technology, Shiyan, China"],"affiliations":[{"raw_affiliation_string":"Hubei University of Automotive Technology, Shiyan, China","institution_ids":["https://openalex.org/I4210126203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015370659","display_name":"Dongping Chen","orcid":"https://orcid.org/0009-0009-9848-2557"},"institutions":[{"id":"https://openalex.org/I4210157617","display_name":"Huazhong University of Science and Technology Hospital","ror":"https://ror.org/05f9vfg11","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210157617"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongping Chen","raw_affiliation_strings":["Huazhong University of Science and Technology, Hubei, China"],"affiliations":[{"raw_affiliation_string":"Huazhong University of Science and Technology, Hubei, China","institution_ids":["https://openalex.org/I4210157617"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083141914","display_name":"Siyuan Wu","orcid":"https://orcid.org/0009-0006-0960-1699"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siyuan Wu","raw_affiliation_strings":["Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101316823","display_name":"Xing Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xing Zhou","raw_affiliation_strings":["Rabbitpre AI, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Rabbitpre AI, Shenzhen, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003231472","display_name":"Wenbin Jiang","orcid":"https://orcid.org/0000-0001-5628-8806"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenbin Jiang","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022262922","display_name":"Hai Jin","orcid":"https://orcid.org/0000-0002-3934-7605"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hai Jin","raw_affiliation_strings":["National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Big Data Technology and System, Services Computing Technology and System Lab, Cluster and Grid Computing Lab, School of Computer Science and Technology, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000755750","display_name":"Xiangliang Zhang","orcid":"https://orcid.org/0000-0002-3574-5665"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiangliang Zhang","raw_affiliation_strings":["University of Notre Dame, Notre Dame, USA"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame, Notre Dame, USA","institution_ids":["https://openalex.org/I107639228"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5084159330"],"corresponding_institution_ids":["https://openalex.org/I47720641"],"apc_list":null,"apc_paid":null,"fwci":15.3115,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.98860399,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1834","last_page":"1845"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9818000197410583,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7516317963600159},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6577559113502502},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.5702866911888123},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4648496210575104},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.38291001319885254},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3676772713661194},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3358301520347595},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.057718127965927124}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7516317963600159},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6577559113502502},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.5702866911888123},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4648496210575104},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.38291001319885254},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3676772713661194},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3358301520347595},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.057718127965927124}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3696410.3714889","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3696410.3714889","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1895577753","https://openalex.org/W2102605133","https://openalex.org/W2117539524","https://openalex.org/W2194775991","https://openalex.org/W2395611524","https://openalex.org/W2560674852","https://openalex.org/W2888557792","https://openalex.org/W2930957955","https://openalex.org/W2962724148","https://openalex.org/W2981852735","https://openalex.org/W3011632945","https://openalex.org/W4288089799","https://openalex.org/W4307472389","https://openalex.org/W4312933868","https://openalex.org/W4397032804","https://openalex.org/W4402753874","https://openalex.org/W4403536858","https://openalex.org/W6600488088","https://openalex.org/W6602003647"],"related_works":["https://openalex.org/W3135843367","https://openalex.org/W2611741382","https://openalex.org/W3112355890","https://openalex.org/W2613685774","https://openalex.org/W4220741973","https://openalex.org/W2326464900","https://openalex.org/W4391422656","https://openalex.org/W2061176321","https://openalex.org/W1994667531","https://openalex.org/W2000745862"],"abstract_inverted_index":{"Automatically":[0],"generating":[1],"webpage":[2,5,53,80,98,182],"code":[3,54,81,99,180,211],"from":[4,86,181],"designs":[6],"can":[7],"significantly":[8,172],"reduce":[9],"the":[10,40,78,128,139,161,174],"workload":[11],"of":[12,42,104,130,176],"front-end":[13,193],"developers,":[14],"and":[15,82,94,145,187,212],"recent":[16],"Multimodal":[17],"Large":[18],"Language":[19],"Models":[20],"(MLLMs)":[21],"have":[22],"shown":[23],"promising":[24],"potential":[25],"in":[26,48,51,192],"this":[27,58,60],"area.":[28],"However,":[29],"our":[30,170,204,218],"investigation":[31],"reveals":[32],"that":[33,115,169],"most":[34],"existing":[35],"MLLMs":[36,177],"are":[37,214],"constrained":[38],"by":[39,111,203],"absence":[41],"high-quality,":[43],"large-scale,":[44],"real-world":[45,87],"datasets,":[46],"resulting":[47],"inadequate":[49],"performance":[50],"automated":[52],"generation.":[55],"To":[56,126],"fill":[57],"gap,":[59],"paper":[61],"introduces":[62],"WebCode2M,":[63,131],"a":[64,73,92,102,112,134,147,155],"new":[65,156],"dataset":[66,96,107,171,213],"comprising":[67],"2.56":[68],"million":[69],"instances,":[70],"each":[71],"containing":[72],"design":[74,194],"image":[75],"along":[76],"with":[77,119],"corresponding":[79],"layout":[83],"details.":[84],"Sourced":[85],"web":[88],"resources,":[89],"WebCode2M":[90],"offers":[91],"rich":[93],"valuable":[95],"for":[97,149,189,207],"generation":[100],"across":[101],"variety":[103],"applications.":[105],"The":[106,165,210],"quality":[108],"is":[109],"ensured":[110],"scoring":[113],"model":[114,136],"filters":[116],"out":[117],"instances":[118],"aesthetic":[120],"deficiencies":[121],"or":[122],"other":[123],"incomplete":[124],"elements.":[125],"validate":[127],"effectiveness":[129,186],"we":[132,153,197],"introduce":[133,154],"baseline":[135],"based":[137],"on":[138],"Vision":[140],"Transformer":[141],"(ViT),":[142],"named":[143],"WebCoder,":[144],"establish":[146],"benchmark":[148],"fair":[150],"comparison.":[151],"Additionally,":[152],"metric,":[157],"TreeBLEU,":[158],"to":[159,178],"measure":[160],"structural":[162],"hierarchy":[163],"recall.":[164],"benchmarking":[166],"results":[167],"demonstrate":[168],"improves":[173],"ability":[175],"generate":[179],"designs,":[183],"confirming":[184],"its":[185],"usability":[188],"future":[190],"applications":[191],"tools.":[195],"Finally,":[196],"highlight":[198],"several":[199],"practical":[200],"challenges":[201],"introduced":[202],"dataset,":[205],"calling":[206],"further":[208],"research.":[209],"publicly":[215],"available":[216],"at":[217],"project":[219],"homepage:":[220],"https://webcode2m.github.io.":[221]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":3}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
