{"id":"https://openalex.org/W7129480583","doi":"https://doi.org/10.48550/arxiv.2602.13662","title":"LeafNet: A Large-Scale Dataset and Comprehensive Benchmark for Foundational Vision-Language Understanding of Plant Diseases","display_name":"LeafNet: A Large-Scale Dataset and Comprehensive Benchmark for Foundational Vision-Language Understanding of Plant Diseases","publication_year":2026,"publication_date":"2026-02-14","ids":{"openalex":"https://openalex.org/W7129480583","doi":"https://doi.org/10.48550/arxiv.2602.13662"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.13662","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070630364","display_name":"Khang Nguyen Quoc","orcid":"https://orcid.org/0000-0003-4927-4822"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quoc, Khang Nguyen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035769784","display_name":"Phuong D. Dao","orcid":"https://orcid.org/0000-0002-3712-9022"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dao, Phuong D.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5031714104","display_name":"Luyl-Da Quach","orcid":"https://orcid.org/0000-0002-5661-4250"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quach, Luyl-Da","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.7113999724388123,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.7113999724388123,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.03519999980926514,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.018699999898672104,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7369999885559082},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6949999928474426},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5723000168800354},{"id":"https://openalex.org/keywords/plant-disease","display_name":"Plant disease","score":0.5242000222206116},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.3366999924182892},{"id":"https://openalex.org/keywords/disease","display_name":"Disease","score":0.2897000014781952}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7369999885559082},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6949999928474426},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6071000099182129},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5723000168800354},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5669000148773193},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5285000205039978},{"id":"https://openalex.org/C3019235130","wikidata":"https://www.wikidata.org/wiki/Q188956","display_name":"Plant disease","level":2,"score":0.5242000222206116},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5199999809265137},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.3366999924182892},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3050999939441681},{"id":"https://openalex.org/C2779134260","wikidata":"https://www.wikidata.org/wiki/Q12136","display_name":"Disease","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C63882131","wikidata":"https://www.wikidata.org/wiki/Q17122954","display_name":"Strengths and weaknesses","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C66905080","wikidata":"https://www.wikidata.org/wiki/Q17005494","display_name":"Binary classification","level":3,"score":0.2590999901294708},{"id":"https://openalex.org/C168820333","wikidata":"https://www.wikidata.org/wiki/Q448889","display_name":"Visual inspection","level":2,"score":0.25850000977516174}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.13662","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.13662","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.13662","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.13662","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/2","score":0.5745177865028381,"display_name":"Zero hunger"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Foundation":[0],"models":[1,158],"and":[2,16,42,55,111,148,159,195,208],"vision-language":[3],"pre-training":[4],"have":[5],"significantly":[6,179],"advanced":[7],"Vision-Language":[8],"Models":[9],"(VLMs),":[10],"enabling":[11],"multimodal":[12,39,53,166],"processing":[13],"of":[14,36,67,101,165],"visual":[15,58,106],"linguistic":[17,177],"data.":[18],"However,":[19],"their":[20,127],"application":[21],"in":[22,69,126,188],"domain-specific":[23],"agricultural":[24,94],"tasks,":[25],"such":[26],"as":[27,201],"plant":[28,71,102,192,214],"pathology,":[29],"remains":[30,151],"limited":[31],"due":[32],"to":[33,62],"the":[34,65,162,197],"lack":[35],"large-scale,":[37],"comprehensive":[38,52],"image--text":[40],"datasets":[41],"benchmarks.":[43],"To":[44],"address":[45],"this":[46],"gap,":[47],"we":[48,122],"introduce":[49],"LeafNet,":[50],"a":[51,57,202],"dataset,":[54,121],"LeafBench,":[56],"question-answering":[59],"benchmark":[60],"developed":[61],"systematically":[63],"evaluate":[64],"capabilities":[66],"VLMs":[68,117,160,169,190],"understanding":[70,129],"diseases.":[72],"The":[73,96],"dataset":[74],"comprises":[75],"186,000":[76],"leaf":[77],"digital":[78],"images":[79],"spanning":[80,91],"97":[81],"disease":[82,128,215],"classes,":[83],"paired":[84],"with":[85],"metadata,":[86],"generating":[87],"13,950":[88],"question-answer":[89],"pairs":[90],"six":[92],"critical":[93,163,186],"tasks.":[95],"questions":[97],"assess":[98],"various":[99],"aspects":[100],"pathology":[103,193],"understanding,":[104],"including":[105],"symptom":[107],"recognition,":[108],"taxonomic":[109],"relationships,":[110],"diagnostic":[112,181],"reasoning.":[113],"Benchmarking":[114],"12":[115],"state-of-the-art":[116],"on":[118],"our":[119],"LeafBench":[120,200],"reveal":[123],"substantial":[124],"disparity":[125],"capabilities.":[130],"Our":[131],"study":[132],"shows":[133],"performance":[134],"varies":[135],"markedly":[136],"across":[137],"tasks:":[138],"binary":[139],"healthy--diseased":[140],"classification":[141],"exceeds":[142],"90%":[143],"accuracy,":[144],"while":[145],"fine-grained":[146],"pathogen":[147],"species":[149],"identification":[150],"below":[152],"65%.":[153],"Direct":[154],"comparison":[155],"between":[156],"vision-only":[157],"demonstrates":[161],"advantage":[164],"architectures:":[167],"fine-tuned":[168],"outperform":[170],"traditional":[171],"vision":[172],"models,":[173],"confirming":[174],"that":[175],"integrating":[176],"representations":[178],"enhances":[180],"precision.":[182],"These":[183],"findings":[184],"highlight":[185],"gaps":[187],"current":[189],"for":[191,199,205],"applications":[194],"underscore":[196],"need":[198],"rigorous":[203],"framework":[204],"methodological":[206],"advancement":[207],"progress":[209],"evaluation":[210],"toward":[211],"reliable":[212],"AI-assisted":[213],"diagnosis.":[216],"Code":[217],"is":[218],"available":[219],"at":[220],"https://github.com/EnalisUs/LeafBench.":[221]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-02-18T00:00:00"}
