{"id":"https://openalex.org/W7148541755","doi":"https://doi.org/10.48550/arxiv.2604.00940","title":"YieldSAT: A Multimodal Benchmark Dataset for High-Resolution Crop Yield Prediction","display_name":"YieldSAT: A Multimodal Benchmark Dataset for High-Resolution Crop Yield Prediction","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148541755","doi":"https://doi.org/10.48550/arxiv.2604.00940"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.00940","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00940","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.00940","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019450085","display_name":"Miro Miranda","orcid":"https://orcid.org/0009-0002-8195-9776"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miranda, Miro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132790691","display_name":"Deepak Pathak","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pathak, Deepak","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032545698","display_name":"Patrick Helber","orcid":"https://orcid.org/0000-0001-8454-4301"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Helber, Patrick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033808296","display_name":"Benjamin Bischke","orcid":"https://orcid.org/0000-0002-6473-3348"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bischke, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087589867","display_name":"Hiba Najjar","orcid":"https://orcid.org/0000-0002-7498-794X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Najjar, Hiba","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022033505","display_name":"Francisco Mena","orcid":"https://orcid.org/0000-0002-5004-6571"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mena, Francisco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101295886","display_name":"Cristhian Sanchez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sanchez, Cristhian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102676931","display_name":"Akshay Pai","orcid":"https://orcid.org/0000-0002-0087-1629"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pai, Akshay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132734900","display_name":"Diego Arenas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arenas, Diego","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013519837","display_name":"Mat\u00edas Valdenegro-Toro","orcid":"https://orcid.org/0000-0001-5793-9498"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Valdenegro-Toro, Matias","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008628120","display_name":"Marcela Charfuel\u00e0n","orcid":"https://orcid.org/0009-0005-6886-0415"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Charfuelan, Marcela","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013923731","display_name":"Marlon Nuske","orcid":"https://orcid.org/0000-0002-0651-0664"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nuske, Marlon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132812955","display_name":"Andreas Dengel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dengel, Andreas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10111","display_name":"Remote Sensing in Agriculture","score":0.5360999703407288,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10111","display_name":"Remote Sensing in Agriculture","score":0.5360999703407288,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.421099990606308,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.005400000140070915,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5669999718666077},{"id":"https://openalex.org/keywords/crop-yield","display_name":"Crop yield","score":0.5304999947547913},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5102999806404114},{"id":"https://openalex.org/keywords/multispectral-image","display_name":"Multispectral image","score":0.5023999810218811},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4823000133037567},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4505999982357025},{"id":"https://openalex.org/keywords/yield","display_name":"Yield (engineering)","score":0.4433000087738037},{"id":"https://openalex.org/keywords/satellite","display_name":"Satellite","score":0.43939998745918274},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.42489999532699585}],"concepts":[{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5669999718666077},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.564300000667572},{"id":"https://openalex.org/C126343540","wikidata":"https://www.wikidata.org/wiki/Q889514","display_name":"Crop yield","level":2,"score":0.5304999947547913},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.510699987411499},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5102999806404114},{"id":"https://openalex.org/C173163844","wikidata":"https://www.wikidata.org/wiki/Q1761440","display_name":"Multispectral image","level":2,"score":0.5023999810218811},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4823000133037567},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4569000005722046},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4505999982357025},{"id":"https://openalex.org/C134121241","wikidata":"https://www.wikidata.org/wiki/Q899301","display_name":"Yield (engineering)","level":2,"score":0.4433000087738037},{"id":"https://openalex.org/C19269812","wikidata":"https://www.wikidata.org/wiki/Q26540","display_name":"Satellite","level":2,"score":0.43939998745918274},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.42489999532699585},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.41850000619888306},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41690000891685486},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.4004000127315521},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.39730000495910645},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.36579999327659607},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.3610000014305115},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.3319000005722046},{"id":"https://openalex.org/C70153297","wikidata":"https://www.wikidata.org/wiki/Q5591907","display_name":"Gradient boosting","level":3,"score":0.3280999958515167},{"id":"https://openalex.org/C2777106113","wikidata":"https://www.wikidata.org/wiki/Q18349347","display_name":"Crop simulation model","level":3,"score":0.32690000534057617},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3264999985694885},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.31520000100135803},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.3100999891757965},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.2969000041484833},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2930000126361847},{"id":"https://openalex.org/C39399123","wikidata":"https://www.wikidata.org/wiki/Q1348989","display_name":"Earth observation","level":3,"score":0.2892000079154968},{"id":"https://openalex.org/C205372480","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"Image resolution","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C2778102629","wikidata":"https://www.wikidata.org/wiki/Q725252","display_name":"Satellite imagery","level":2,"score":0.25780001282691956},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.00940","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00940","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.00940","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00940","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.8276267051696777,"id":"https://metadata.un.org/sdg/13","display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Crop":[0],"yield":[1,12,67,103,143],"prediction":[2,13,144],"requires":[3],"substantial":[4],"data":[5,22,25,157,174],"to":[6,38],"train":[7],"scalable":[8,49],"models.":[9],"However,":[10],"creating":[11],"datasets":[14,30],"is":[15,117,195],"constrained":[16],"by":[17,130,150],"high":[18],"acquisition":[19],"costs,":[20],"heterogeneous":[21],"quality,":[23,35],"and":[24,61,81,83,92,140,156],"privacy":[26],"regulations.":[27],"Consequently,":[28],"existing":[29],"are":[31,105],"scarce,":[32],"low":[33],"in":[34,124,170],"or":[36,41],"limited":[37],"regional":[39],"levels":[40],"single":[42],"crop":[43,66,86,142],"types,":[44,87],"hindering":[45],"the":[46,136,171],"development":[47],"of":[48,112,138],"data-driven":[50],"solutions.":[51],"In":[52,98],"this":[53],"work,":[54],"we":[55,161,181],"release":[56],"YieldSAT,":[57],"a":[58,109,146,183],"large,":[59],"high-quality,":[60],"multimodal":[62],"dataset":[63,194],"for":[64],"high-resolution":[65,141],"prediction.":[68],"YieldSAT":[69],"spans":[70],"various":[71,152],"climate":[72],"zones":[73],"across":[74,94],"multiple":[75],"countries,":[76],"including":[77,88],"Argentina,":[78],"Brazil,":[79],"Uruguay,":[80],"Germany,":[82],"includes":[84],"major":[85],"corn,":[89],"rapeseed,":[90],"soybeans,":[91],"wheat,":[93],"2,173":[95],"expert-curated":[96],"fields.":[97],"total,":[99],"over":[100],"12.2":[101],"million":[102],"samples":[104],"available,":[106],"each":[107],"with":[108,119],"spatial":[110],"resolution":[111],"10":[113],"m.":[114],"Each":[115],"field":[116],"paired":[118],"multispectral":[120],"satellite":[121,127],"imagery,":[122],"resulting":[123],"113,555":[125],"labeled":[126],"images,":[128],"complemented":[129],"auxiliary":[131],"environmental":[132],"data.":[133],"We":[134],"demonstrate":[135],"potential":[137],"large-scale":[139],"as":[145],"pixel":[147],"regression":[148],"task":[149],"comparing":[151],"deep":[153],"learning":[154],"models":[155],"fusion":[158],"architectures.":[159],"Furthermore,":[160],"highlight":[162],"open":[163],"challenges":[164],"arising":[165],"from":[166],"severe":[167],"distribution":[168],"shifts":[169],"ground":[172],"truth":[173],"under":[175],"real-world":[176],"conditions.":[177],"To":[178],"mitigate":[179],"this,":[180],"explore":[182],"domain-informed":[184],"Deep":[185],"Ensemble":[186],"approach":[187],"that":[188],"exhibits":[189],"significant":[190],"performance":[191],"gains.":[192],"The":[193],"available":[196],"at":[197],"https://yieldsat.github.io/.":[198]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-03T00:00:00"}
