{"id":"https://openalex.org/W7123846008","doi":"https://doi.org/10.48550/arxiv.2601.07477","title":"JudgeFlow: Agentic Workflow Optimization via Block Judge","display_name":"JudgeFlow: Agentic Workflow Optimization via Block Judge","publication_year":2026,"publication_date":"2026-01-12","ids":{"openalex":"https://openalex.org/W7123846008","doi":"https://doi.org/10.48550/arxiv.2601.07477"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2601.07477","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122938392","display_name":"Zihan Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ma, Zihan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122940781","display_name":"Zhikai Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Zhikai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039806945","display_name":"Chuanbo Hua","orcid":"https://orcid.org/0000-0001-7700-792X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hua, Chuanbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Berto, Federico","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Berto, Federico","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5122967102","display_name":"Jinkyoo Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Jinkyoo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5122938392"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.7753999829292297,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.7753999829292297,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.0746999979019165,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.015399999916553497,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.8840000033378601},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.796500027179718},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6416000127792358},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5975000262260437},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.39489999413490295},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.3386000096797943}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.8840000033378601},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8009999990463257},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.796500027179718},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6416000127792358},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5975000262260437},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4302000105381012},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.39489999413490295},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37770000100135803},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3741999864578247},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3684000074863434},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.353300005197525},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3386000096797943},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.3379000127315521},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.3172999918460846},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2782000005245209},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2601.07477","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2601.07477","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.07477","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2601.07477","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Optimizing":[0],"LLM-based":[1,93],"agentic":[2,50,125],"workflows":[3,51],"is":[4],"challenging":[5],"for":[6,121],"scaling":[7],"AI":[8],"capabilities.":[9],"Current":[10],"methods":[11],"rely":[12],"on":[13,22,98,130],"coarse,":[14],"end-to-end":[15],"evaluation":[16],"signals":[17,21,87],"and":[18,76,116,133,142],"lack":[19],"fine-grained":[20,85],"where":[23,137],"to":[24,52,81,145],"refine,":[25],"often":[26],"resulting":[27],"in":[28,103],"inefficient":[29],"or":[30],"low-impact":[31],"modifications.":[32],"To":[33],"address":[34],"these":[35],"limitations,":[36],"we":[37,63],"propose":[38],"JudgeFlow,":[39],"an":[40,92],"Evaluation-Judge-Optimization-Update":[41],"pipeline.":[42],"We":[43,127],"incorporate":[44],"reusable,":[45],"configurable":[46],"logic":[47],"blocks":[48],"into":[49],"capture":[53],"fundamental":[54],"forms":[55],"of":[56,60],"logic.":[57],"On":[58],"top":[59],"this":[61],"abstraction,":[62],"design":[64],"a":[65,118],"dedicated":[66],"Judge":[67],"module":[68],"that":[69],"inspects":[70],"execution":[71],"traces":[72],"particularly":[73],"failed":[74],"runs":[75],"assigns":[77],"rank-based":[78],"responsibility":[79],"scores":[80],"problematic":[82,101],"blocks.":[83],"These":[84],"diagnostic":[86],"are":[88],"then":[89],"leveraged":[90],"by":[91],"optimizer,":[94],"which":[95],"focuses":[96],"modifications":[97],"the":[99,104],"most":[100],"block":[102],"workflow.":[105],"Our":[106],"approach":[107],"improves":[108],"sample":[109],"efficiency,":[110],"enhances":[111],"interpretability":[112],"through":[113],"block-level":[114],"diagnostics,":[115],"provides":[117],"scalable":[119],"foundation":[120],"automating":[122],"increasingly":[123],"complex":[124],"workflows.":[126],"evaluate":[128],"JudgeFlow":[129,138],"mathematical":[131],"reasoning":[132],"code":[134],"generation":[135],"benchmarks,":[136],"achieves":[139],"superior":[140],"performance":[141],"efficiency":[143],"compared":[144],"existing":[146],"methods.":[147]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-01-14T00:00:00"}
