{"id":"https://openalex.org/W7147360831","doi":"https://doi.org/10.48550/arxiv.2603.27519","title":"SPROUT: A Scalable Diffusion Foundation Model for Agricultural Vision","display_name":"SPROUT: A Scalable Diffusion Foundation Model for Agricultural Vision","publication_year":2026,"publication_date":"2026-03-29","ids":{"openalex":"https://openalex.org/W7147360831","doi":"https://doi.org/10.48550/arxiv.2603.27519"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.27519","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.27519","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007059437","display_name":"Shuai Xiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiang, Shuai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132657566","display_name":"Wei Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016540675","display_name":"James Burridge","orcid":"https://orcid.org/0000-0002-2194-9894"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Burridge, James","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040788606","display_name":"Shouyang Liu","orcid":"https://orcid.org/0000-0003-4649-4192"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Shouyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132597469","display_name":"Hao Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5110288768","display_name":"Tokihiro Fukatsu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fukatsu, Tokihiro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.8934000134468079,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.8934000134468079,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.01119999960064888,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12093","display_name":"Greenhouse Technology and Climate Control","score":0.006899999920278788,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6238999962806702},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.5665000081062317},{"id":"https://openalex.org/keywords/agriculture","display_name":"Agriculture","score":0.48910000920295715},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.3714999854564667},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.3441999852657318},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.33379998803138733}],"concepts":[{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6238999962806702},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6118999719619751},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.5665000081062317},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5156999826431274},{"id":"https://openalex.org/C118518473","wikidata":"https://www.wikidata.org/wiki/Q11451","display_name":"Agriculture","level":2,"score":0.48910000920295715},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3880000114440918},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3714999854564667},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.3441999852657318},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.33379998803138733},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3296999931335449},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3174000084400177},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.31470000743865967},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2888999879360199},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.28119999170303345},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C47136581","wikidata":"https://www.wikidata.org/wiki/Q16000047","display_name":"Agricultural machinery","level":3,"score":0.2558000087738037}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.27519","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.27519","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.7524753212928772,"display_name":"Zero hunger","id":"https://metadata.un.org/sdg/2"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision":[0],"Foundation":[1],"Models":[2],"(VFM)":[3],"pre-trained":[4],"on":[5,13,75],"large-scale":[6],"unlabeled":[7],"data":[8],"have":[9],"achieved":[10],"remarkable":[11],"success":[12],"general":[14],"computer":[15],"vision":[16],"tasks,":[17,111],"yet":[18],"typically":[19],"suffer":[20],"from":[21],"significant":[22],"domain":[23],"gaps":[24],"when":[25],"applied":[26],"to":[27,60],"agriculture.":[28],"In":[29],"this":[30],"context,":[31],"we":[32],"introduce":[33],"$SPROUT$":[34],"($S$calable":[35],"$P$lant":[36],"$R$epresentation":[37],"model":[38,48,121],"via":[39,50],"$O$pen-field":[40],"$U$nsupervised":[41],"$T$raining),":[42],"a":[43,55,76,106],"multi-crop,":[44],"multi-task":[45],"agricultural":[46,83,102],"foundation":[47,103],"trained":[49],"diffusion":[51],"denoising.":[52],"SPROUT":[53,74,96],"leverages":[54],"VAE-free":[56],"Pixel-space":[57],"Diffusion":[58],"Transformer":[59],"learn":[61],"rich,":[62],"structure-aware":[63],"representations":[64],"through":[65],"denoising":[66],"and":[67,90,101,120],"enabling":[68],"efficient":[69],"end-to-end":[70],"training.":[71],"We":[72],"pre-train":[73],"curated":[77],"dataset":[78],"of":[79,109],"2.6":[80],"million":[81],"high-quality":[82],"images":[84],"spanning":[85],"diverse":[86],"crops,":[87],"growth":[88],"stages,":[89],"environments.":[91],"Extensive":[92],"experiments":[93],"demonstrate":[94],"that":[95],"consistently":[97],"outperforms":[98],"state-of-the-art":[99],"web-pretrained":[100],"models":[104],"across":[105],"wide":[107],"range":[108],"downstream":[110],"while":[112],"requiring":[113],"substantially":[114],"lower":[115],"pre-training":[116],"cost.":[117],"The":[118],"code":[119],"are":[122],"available":[123],"at":[124],"https://github.com/UTokyo-FieldPhenomics-Lab/SPROUT.":[125]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-02T00:00:00"}
