{"id":"https://openalex.org/W4400222257","doi":"https://doi.org/10.48550/arxiv.2406.20098","title":"Web2Code: A Large-scale Webpage-to-Code Dataset and Evaluation Framework for Multimodal LLMs","display_name":"Web2Code: A Large-scale Webpage-to-Code Dataset and Evaluation Framework for Multimodal LLMs","publication_year":2024,"publication_date":"2024-06-28","ids":{"openalex":"https://openalex.org/W4400222257","doi":"https://doi.org/10.48550/arxiv.2406.20098"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2406.20098","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.20098","pdf_url":"https://arxiv.org/pdf/2406.20098","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.20098","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108950452","display_name":"Sukmin Yun","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yun, Sukmin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025724191","display_name":"Haokun Lin","orcid":"https://orcid.org/0009-0004-8395-392X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Haokun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099801437","display_name":"Rusiru Thushara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thushara, Rusiru","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101390509","display_name":"Mohammad Qazim Bhat","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhat, Mohammad Qazim","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100661148","display_name":"Yongxin Wang","orcid":"https://orcid.org/0000-0002-0172-9085"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yongxin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101692928","display_name":"Zutao Jiang","orcid":"https://orcid.org/0000-0002-6787-5499"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Zutao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113273837","display_name":"Mingkai Deng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deng, Mingkai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100775331","display_name":"Jinhong Wang","orcid":"https://orcid.org/0000-0001-7975-0565"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jinhong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081822522","display_name":"Tianhua Tao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao, Tianhua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101548643","display_name":"Junbo Li","orcid":"https://orcid.org/0009-0002-2516-9227"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Junbo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100742670","display_name":"Haonan Li","orcid":"https://orcid.org/0000-0002-0501-4394"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Haonan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012055259","display_name":"Preslav Nakov","orcid":"https://orcid.org/0000-0002-3600-1510"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nakov, Preslav","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060332228","display_name":"Timothy Baldwin","orcid":"https://orcid.org/0000-0003-4525-6950"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baldwin, Timothy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029648803","display_name":"Zhengzhong Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zhengzhong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009547049","display_name":"Eric P. Xing","orcid":"https://orcid.org/0009-0005-9158-4201"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xing, Eric P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047878798","display_name":"Xiaodan Liang","orcid":"https://orcid.org/0000-0003-3213-3062"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Xiaodan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5068778761","display_name":"Zhiqiang Shen","orcid":"https://orcid.org/0000-0003-0804-2478"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Zhiqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":17,"corresponding_author_ids":["https://openalex.org/A5108950452"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10759","display_name":"Translation Studies and Practices","score":0.9437000155448914,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12478","display_name":"Wikis in Education and Collaboration","score":0.942799985408783,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6389212608337402},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.6331666111946106},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5499552488327026},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.38656941056251526},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.34466075897216797},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.34179186820983887},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.2497948706150055},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.15314564108848572},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10581129789352417}],"concepts":[{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6389212608337402},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.6331666111946106},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5499552488327026},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.38656941056251526},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34466075897216797},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.34179186820983887},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.2497948706150055},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.15314564108848572},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10581129789352417},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2406.20098","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.20098","pdf_url":"https://arxiv.org/pdf/2406.20098","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-152733","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-152733","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"},{"id":"doi:10.48550/arxiv.2406.20098","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2406.20098","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2406.20098","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.20098","pdf_url":"https://arxiv.org/pdf/2406.20098","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W4213212078","https://openalex.org/W2187227032","https://openalex.org/W2112788825","https://openalex.org/W1963735073","https://openalex.org/W4233129888","https://openalex.org/W106707639","https://openalex.org/W2146247781","https://openalex.org/W2144684733","https://openalex.org/W4299950557"],"abstract_inverted_index":{"Multimodal":[0],"large":[1],"language":[2,121],"models":[3],"(MLLMs)":[4],"have":[5],"shown":[6],"impressive":[7],"success":[8],"across":[9],"modalities":[10],"such":[11],"as":[12,87,89],"image,":[13],"video,":[14],"and":[15,22,35,60,68,106,160,202,207],"audio":[16],"in":[17,128,145,157,180],"a":[18,48,52,91,133],"variety":[19],"of":[20,51,73,94,137,194],"understanding":[21,32,67,136,159],"generation":[23,201],"tasks.":[24],"However,":[25],"current":[26],"MLLMs":[27,196],"are":[28,103,111,209],"surprisingly":[29],"poor":[30],"at":[31,211],"webpage":[33,66,104,126,158],"screenshots":[34],"generating":[36],"their":[37],"corresponding":[38],"HTML":[39,69,114],"code.":[40,115],"To":[41,141],"address":[42],"this":[43],"problem,":[44],"we":[45,78,148],"propose":[46],"$\\texttt{Web2Code}$,":[47],"benchmark":[49],"consisting":[50],"new":[53,95],"large-scale":[54],"webpage-to-code":[55,85],"dataset":[56,76,169],"for":[57,64,153,198],"instruction":[58],"tuning":[59],"an":[61,150],"evaluation":[62,151],"framework":[63,152],"the":[65,101,109,112,125,129,138,181,192],"code":[70,208],"translation":[71],"abilities":[72,156],"MLLMs.":[74],"For":[75],"construction,":[77],"leverage":[79],"pretrained":[80],"LLMs":[81],"to":[82,131,174,191],"enhance":[83],"existing":[84],"datasets":[86],"well":[88],"generate":[90],"diverse":[92,119],"pool":[93],"webpages":[96],"rendered":[97],"into":[98],"images.":[99],"Specifically,":[100],"inputs":[102],"images":[105],"instructions,":[107],"while":[108],"responses":[110,130],"webpage's":[113],"We":[116,185],"further":[117],"include":[118],"natural":[120],"QA":[122],"pairs":[123],"about":[124],"content":[127,200],"enable":[132],"more":[134],"comprehensive":[135],"web":[139],"content.":[140],"evaluate":[142],"model":[143],"performance":[144],"these":[146],"tasks,":[147],"develop":[149],"testing":[154],"MLLMs'":[155],"web-to-code":[161],"generation.":[162],"Extensive":[163],"experiments":[164],"show":[165],"that":[166],"our":[167,175,187],"proposed":[168,176],"is":[170],"beneficial":[171],"not":[172],"only":[173],"tasks":[177],"but":[178],"also":[179],"general":[182,195],"visual":[183],"domain.":[184],"hope":[186],"work":[188],"will":[189],"contribute":[190],"development":[193],"suitable":[197],"web-based":[199],"task":[203],"automation.":[204],"Our":[205],"data":[206],"available":[210],"https://github.com/MBZUAI-LLM/web2code.":[212]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2024-07-02T00:00:00"}
