{"id":"https://openalex.org/W4388964369","doi":"https://doi.org/10.48550/arxiv.2311.12890","title":"De-fine: Decomposing and Refining Visual Programs with Auto-Feedback","display_name":"De-fine: Decomposing and Refining Visual Programs with Auto-Feedback","publication_year":2023,"publication_date":"2023-11-21","ids":{"openalex":"https://openalex.org/W4388964369","doi":"https://doi.org/10.48550/arxiv.2311.12890"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2311.12890","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.12890","pdf_url":"https://arxiv.org/pdf/2311.12890","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2311.12890","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061203331","display_name":"Minghe Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gao, Minghe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100648014","display_name":"Juncheng Li","orcid":"https://orcid.org/0000-0001-7314-6754"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Juncheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002241280","display_name":"Fei Hao","orcid":"https://orcid.org/0000-0001-5288-5523"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fei, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110470213","display_name":"Wei Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pang, Liang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101477058","display_name":"Guoming Wang","orcid":"https://orcid.org/0000-0003-3131-6916"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ji, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082131901","display_name":"Wenqiao Zhang","orcid":"https://orcid.org/0000-0002-5988-7609"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Guoming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063062444","display_name":"Siliang Tang","orcid":"https://orcid.org/0000-0002-7356-9711"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lv, Zheqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008666077","display_name":"Yueting Zhuang","orcid":"https://orcid.org/0000-0001-9017-2508"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Wenqiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Tang, Siliang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Siliang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Zhuang, Yueting","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhuang, Yueting","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5061203331"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9697999954223633,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.9419000148773193,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8156808614730835},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.6392413377761841},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.574120819568634},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.5704745650291443},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5497341156005859},{"id":"https://openalex.org/keywords/visual-programming-language","display_name":"Visual programming language","score":0.49472615122795105},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.48298612236976624},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4015589952468872},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3117036521434784}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8156808614730835},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.6392413377761841},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.574120819568634},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.5704745650291443},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5497341156005859},{"id":"https://openalex.org/C128644962","wikidata":"https://www.wikidata.org/wiki/Q683111","display_name":"Visual programming language","level":2,"score":0.49472615122795105},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.48298612236976624},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4015589952468872},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3117036521434784},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2311.12890","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.12890","pdf_url":"https://arxiv.org/pdf/2311.12890","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2311.12890","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2311.12890","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2311.12890","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2311.12890","pdf_url":"https://arxiv.org/pdf/2311.12890","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4388964369.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2341492732","https://openalex.org/W3187193180","https://openalex.org/W106542691","https://openalex.org/W4287027380","https://openalex.org/W1699080303","https://openalex.org/W4297799326","https://openalex.org/W2207495067","https://openalex.org/W1906486629","https://openalex.org/W2161373261","https://openalex.org/W1924502949"],"abstract_inverted_index":{"Visual":[0],"programming,":[1],"a":[2,44,80],"modular":[3],"and":[4,10,31,55,91],"generalizable":[5],"paradigm,":[6],"integrates":[7],"different":[8],"modules":[9],"Python":[11],"operators":[12],"to":[13,53],"solve":[14],"various":[15,114],"vision-language":[16],"tasks.":[17],"Unlike":[18],"end-to-end":[19],"models":[20],"that":[21,83,118],"need":[22],"task-specific":[23],"data,":[24],"it":[25],"advances":[26],"in":[27,33,43],"performing":[28],"visual":[29,38,115],"processing":[30],"reasoning":[32,102],"an":[34,130],"unsupervised":[35],"manner.":[36],"Current":[37],"programming":[39],"methods":[40],"generate":[41],"programs":[42,93],"single":[45],"pass":[46],"for":[47,68,137],"each":[48,126],"task":[49],"where":[50],"the":[51,106,138],"ability":[52],"evaluate":[54],"optimize":[56],"based":[57],"on":[58],"feedback,":[59],"unfortunately,":[60],"is":[61],"lacking,":[62],"which":[63],"consequentially":[64],"limits":[65],"their":[66],"effectiveness":[67],"complex,":[69],"multi-step":[70],"problems.":[71],"Drawing":[72],"inspiration":[73],"from":[74],"benders":[75],"decomposition,":[76],"we":[77],"introduce":[78],"De-fine,":[79],"training-free":[81],"framework":[82],"automatically":[84],"decomposes":[85],"complex":[86],"tasks":[87,116],"into":[88],"simpler":[89],"subtasks":[90],"refines":[92],"through":[94],"auto-feedback.":[95],"This":[96],"model-agnostic":[97],"approach":[98],"can":[99],"improve":[100],"logical":[101],"performance":[103],"by":[104],"integrating":[105],"strengths":[107],"of":[108,140],"multiple":[109],"models.":[110],"Our":[111],"experiments":[112],"across":[113],"show":[117],"De-fine":[119],"creates":[120],"more":[121],"robust":[122],"programs.":[123],"Moreover,":[124],"viewing":[125],"feedback":[127],"module":[128],"as":[129],"independent":[131],"agent":[132,141],"will":[133],"yield":[134],"fresh":[135],"prospects":[136],"field":[139],"research.":[142]},"counts_by_year":[],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2025-10-10T00:00:00"}
