{"id":"https://openalex.org/W7140340982","doi":"https://doi.org/10.48550/arxiv.2603.22622","title":"A Vision Language Model for Generating Procedural Plant Architecture Representations from Simulated Images","display_name":"A Vision Language Model for Generating Procedural Plant Architecture Representations from Simulated Images","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7140340982","doi":"https://doi.org/10.48550/arxiv.2603.22622"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22622","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22622","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22622","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048969131","display_name":"Heesup Yun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yun, Heesup","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130602834","display_name":"Isaac Kazuo Uyehara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Uyehara, Isaac Kazuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032759144","display_name":"Ioannis Droutsas","orcid":"https://orcid.org/0000-0002-5123-3379"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Droutsas, Ioannis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119248971","display_name":"Earl Ranario","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ranario, Earl","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013340604","display_name":"Christine Diepenbrock","orcid":"https://orcid.org/0000-0001-8411-0343"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Diepenbrock, Christine H.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008008876","display_name":"Brian N. Bailey","orcid":"https://orcid.org/0000-0003-1919-2324"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bailey, Brian N.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130544215","display_name":"J. Mason Earles","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Earles, J. Mason","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12093","display_name":"Greenhouse Technology and Climate Control","score":0.7516000270843506,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12093","display_name":"Greenhouse Technology and Climate Control","score":0.7516000270843506,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.048500001430511475,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12813","display_name":"Plant and Biological Electrophysiology Studies","score":0.014700000174343586,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6984000205993652},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.6238999962806702},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.6097000241279602},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5746999979019165},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5496000051498413},{"id":"https://openalex.org/keywords/architectural-model","display_name":"Architectural model","score":0.4781000018119812},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4575999975204468},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.43290001153945923}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7067000269889832},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6984000205993652},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.6238999962806702},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.6097000241279602},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5746999979019165},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5496000051498413},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4799000024795532},{"id":"https://openalex.org/C2778544944","wikidata":"https://www.wikidata.org/wiki/Q1352349","display_name":"Architectural model","level":3,"score":0.4781000018119812},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4575999975204468},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.43290001153945923},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.42640000581741333},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3508000075817108},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3262999951839447},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3248000144958496},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.319599986076355},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.31060001254081726},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.2921999990940094},{"id":"https://openalex.org/C100463513","wikidata":"https://www.wikidata.org/wiki/Q5227322","display_name":"Data model (GIS)","level":2,"score":0.2904999852180481},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29019999504089355},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.28929999470710754},{"id":"https://openalex.org/C3019235130","wikidata":"https://www.wikidata.org/wiki/Q188956","display_name":"Plant disease","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28450000286102295},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.27379998564720154},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2669999897480011},{"id":"https://openalex.org/C189474733","wikidata":"https://www.wikidata.org/wiki/Q917912","display_name":"Model building","level":2,"score":0.2542000114917755}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22622","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22622","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22622","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22622","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Three-dimensional":[0],"(3D)":[1],"procedural":[2,120],"plant":[3,16,21,62,71,123,165,173,178,187,195,249],"architecture":[4,63,179,188,250],"models":[5,45],"have":[6],"emerged":[7],"as":[8],"an":[9,65],"important":[10],"tool":[11],"for":[12,28,43,131,190],"simulation-based":[13],"studies":[14],"of":[15,86,91,107,122,142,163,216,222,234,240],"structure":[17,106],"and":[18,27,40,77,80,133,236,253],"function,":[19],"extracting":[20],"architectural":[22,38,137,147],"parameters":[23,39,79,138,148],"from":[24,64,152,258],"field":[25,48],"measurements,":[26],"generating":[29],"realistic":[30],"plants":[31],"in":[32,181],"computer":[33,100],"graphics.":[34],"However,":[35],"measuring":[36],"the":[37,47,87,104,143,170,176,191,223,245,266],"nested":[41],"structures":[42],"these":[44],"at":[46],"scales":[49],"remains":[50],"prohibitively":[51],"labor-intensive.":[52],"We":[53,184],"present":[54],"a":[55,60,68,82,111,119,156,186,200,204,212,231,237],"novel":[56],"algorithm":[57],"that":[58,73,113,117,145,203,247],"generates":[59,114],"3D":[61,93,105,172],"image,":[66],"creating":[67],"functional":[69],"structural":[70],"model":[72,158,206,210,224,251],"reflects":[74],"organ-level":[75,146],"geometric":[76],"topological":[78],"provides":[81],"more":[83],"comprehensive":[84],"representation":[85],"plant's":[88],"architecture.":[89,124],"Instead":[90],"using":[92,155,169],"sensors":[94],"or":[95],"processing":[96],"multi-view":[97],"images":[98,130,166],"with":[99,135,175],"vision":[101],"to":[102,244,268],"obtain":[103],"plants,":[108],"we":[109],"proposed":[110],"method":[112],"token":[115,201,213],"sequences":[116],"encode":[118],"definition":[121],"This":[125,242],"work":[126,263],"used":[127],"only":[128],"synthetic":[129,161,259],"training":[132],"testing,":[134],"exact":[136],"known,":[139],"allowing":[140],"testing":[141],"hypothesis":[144],"could":[149],"be":[150],"extracted":[151],"image":[153],"data":[154],"vision-language":[157],"(VLM).":[159],"A":[160],"dataset":[162],"cowpea":[164],"was":[167,225],"generated":[168],"Helios":[171],"simulator,":[174],"detailed":[177],"encoded":[180],"XML":[182,192],"files.":[183],"developed":[185],"tokenizer":[189],"file":[193],"defining":[194],"architecture,":[196],"converting":[197],"it":[198],"into":[199],"sequence":[202],"language":[205],"can":[207],"predict.":[208],"The":[209],"achieved":[211],"F1":[214],"score":[215,233,239],"0.73":[217],"during":[218],"teacher-forced":[219],"training.":[220],"Evaluation":[221],"performed":[226],"through":[227],"autoregressive":[228],"generation,":[229],"achieving":[230],"BLEU-4":[232],"94.00%":[235],"ROUGE-L":[238],"0.5182.":[241],"led":[243],"conclusion":[246],"such":[248],"generation":[252],"parameter":[254],"extraction":[255],"were":[256],"possible":[257],"images;":[260],"thus,":[261],"future":[262],"will":[264],"extend":[265],"approach":[267],"real":[269],"imagery":[270],"data.":[271]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-03-26T00:00:00"}
