{"id":"https://openalex.org/W7155166020","doi":"https://doi.org/10.48550/arxiv.2604.19667","title":"Chat2Workflow: A Benchmark for Generating Executable Visual Workflows with Natural Language","display_name":"Chat2Workflow: A Benchmark for Generating Executable Visual Workflows with Natural Language","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155166020","doi":"https://doi.org/10.48550/arxiv.2604.19667"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.19667","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19667","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.19667","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073925367","display_name":"Yi Zhong","orcid":"https://orcid.org/0000-0002-0929-8224"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhong, Yi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082272714","display_name":"Xu BuQiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Buqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134258647","display_name":"Yijun Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yijun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134257746","display_name":"Zifei Shan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shan, Zifei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091748443","display_name":"Shuofei Qiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiao, Shuofei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030057133","display_name":"Guozhou Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Guozhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134359649","display_name":"Ningyu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ningyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5073925367"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.14659999310970306,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.14659999310970306,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.09200000017881393,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.059700001031160355,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.9171000123023987},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8284000158309937},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5981000065803528},{"id":"https://openalex.org/keywords/visual-language","display_name":"Visual language","score":0.5781999826431274},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.44130000472068787},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3384999930858612}],"concepts":[{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.9171000123023987},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8284000158309937},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8065000176429749},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.6037999987602234},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5981000065803528},{"id":"https://openalex.org/C2780878386","wikidata":"https://www.wikidata.org/wiki/Q1659648","display_name":"Visual language","level":2,"score":0.5781999826431274},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.45969998836517334},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.44130000472068787},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3384999930858612},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2985999882221222},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2816999852657318},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.2635999917984009},{"id":"https://openalex.org/C2780330621","wikidata":"https://www.wikidata.org/wiki/Q7936609","display_name":"Visual modeling","level":4,"score":0.258899986743927},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.2565999925136566}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.19667","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19667","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.19667","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19667","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.6444393992424011,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"At":[0],"present,":[1],"executable":[2,77,149],"visual":[3,78],"workflows":[4,25,79],"have":[5],"emerged":[6],"as":[7,48,125,174],"a":[8,73,86,98,175],"mainstream":[9],"paradigm":[10],"in":[11,21],"real-world":[12,102,170],"industrial":[13],"deployments,":[14],"offering":[15],"strong":[16],"reliability":[17],"and":[18,43,56,84,117,127,148,154],"controllability.":[19],"However,":[20],"current":[22],"practice,":[23],"such":[24,124],"are":[26],"almost":[27],"entirely":[28],"constructed":[29],"through":[30],"manual":[31],"engineering:":[32],"developers":[33],"must":[34],"carefully":[35],"design":[36],"workflows,":[37,104,150],"write":[38],"prompts":[39],"for":[40,75,177],"each":[41,106],"step,":[42],"repeatedly":[44],"revise":[45],"the":[46,111,168],"logic":[47],"requirements":[49],"evolve":[50],"--":[51],"making":[52],"development":[53],"costly,":[54],"time-consuming,":[55],"error-prone.":[57],"To":[58],"study":[59],"whether":[60],"large":[61,99],"language":[62,135],"models":[63,136],"can":[64,114,137],"automate":[65],"this":[66],"multi-round":[67],"interaction":[68],"process,":[69],"we":[70],"introduce":[71],"Chat2Workflow,":[72],"benchmark":[74,94],"generating":[76],"directly":[80,118],"from":[81,97],"natural":[82],"language,":[83],"propose":[85],"robust":[87],"agentic":[88,159],"baseline":[89,160],"to":[90,120,144,163],"improve":[91],"performance.":[92],"The":[93],"is":[95,182],"built":[96],"collection":[100],"of":[101],"business":[103],"with":[105],"instance":[107],"designed":[108],"so":[109],"that":[110,132],"generated":[112],"workflow":[113,122],"be":[115],"transformed":[116],"deployed":[119],"practical":[121],"platforms":[123],"Dify":[126],"Coze.":[128],"Experimental":[129],"results":[130],"show":[131],"while":[133],"state-of-the-art":[134],"often":[138],"capture":[139],"high-level":[140],"intent,":[141],"they":[142],"struggle":[143],"generate":[145],"correct,":[146],"stable,":[147],"especially":[151],"given":[152],"complex":[153],"evolving":[155],"requirements.":[156],"Although":[157],"our":[158],"yields":[161],"up":[162],"6.05%":[164],"resolve":[165],"rate":[166],"gains,":[167],"remaining":[169],"gap":[171],"positions":[172],"Chat2Workflow":[173],"foundation":[176],"advancing":[178],"industrial-grade":[179],"automation.":[180],"Code":[181],"available":[183],"at":[184],"https://github.com/zjunlp/Chat2Workflow.":[185]},"counts_by_year":[],"updated_date":"2026-05-28T06:12:49.907903","created_date":"2026-04-23T00:00:00"}
