{"id":"https://openalex.org/W7128697779","doi":"https://doi.org/10.1016/j.ecoinf.2026.103656","title":"Large language vision models for zero-shot handwriting recognition of historical herbarium labels","display_name":"Large language vision models for zero-shot handwriting recognition of historical herbarium labels","publication_year":2026,"publication_date":"2026-02-12","ids":{"openalex":"https://openalex.org/W7128697779","doi":"https://doi.org/10.1016/j.ecoinf.2026.103656"},"language":"en","primary_location":{"id":"doi:10.1016/j.ecoinf.2026.103656","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.ecoinf.2026.103656","pdf_url":null,"source":{"id":"https://openalex.org/S195809937","display_name":"Ecological Informatics","issn_l":"1574-9541","issn":["1574-9541","1878-0512"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Ecological Informatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1016/j.ecoinf.2026.103656","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125723303","display_name":"Matthias K\u00f6rschens","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Matthias K\u00f6rschens","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-0755-2006","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088990196","display_name":"Solveig Franziska Bucher","orcid":"https://orcid.org/0000-0002-2303-4583"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Solveig Franziska Bucher","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-2303-4583","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125752478","display_name":"Christiane M. Ritz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Christiane M. Ritz","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-7246-1004","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125745807","display_name":"Sebastian Gebauer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sebastian Gebauer","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0003-2051-0406","affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032730951","display_name":"Jens Wesenberg","orcid":"https://orcid.org/0000-0002-1694-1740"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jens Wesenberg","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-1694-1740","affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125744035","display_name":"Christine R\u00f6mermann","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Christine R\u00f6mermann","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0003-3471-0951","affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5125723303"],"corresponding_institution_ids":[],"apc_list":{"value":2510,"currency":"USD","value_usd":2510},"apc_paid":{"value":2510,"currency":"USD","value_usd":2510},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.28217216,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"94","issue":null,"first_page":"103656","last_page":"103656"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.8694999814033508,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.8694999814033508,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.03290000185370445,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.012000000104308128,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/handwriting","display_name":"Handwriting","score":0.7760000228881836},{"id":"https://openalex.org/keywords/herbarium","display_name":"Herbarium","score":0.589900016784668},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3797000050544739},{"id":"https://openalex.org/keywords/handwriting-recognition","display_name":"Handwriting recognition","score":0.29440000653266907}],"concepts":[{"id":"https://openalex.org/C2779386606","wikidata":"https://www.wikidata.org/wiki/Q2393642","display_name":"Handwriting","level":2,"score":0.7760000228881836},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6844000220298767},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6470999717712402},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6345999836921692},{"id":"https://openalex.org/C78945076","wikidata":"https://www.wikidata.org/wiki/Q181916","display_name":"Herbarium","level":2,"score":0.589900016784668},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4171999990940094},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3797000050544739},{"id":"https://openalex.org/C112640561","wikidata":"https://www.wikidata.org/wiki/Q2440634","display_name":"Handwriting recognition","level":3,"score":0.29440000653266907},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2531999945640564}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1016/j.ecoinf.2026.103656","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.ecoinf.2026.103656","pdf_url":null,"source":{"id":"https://openalex.org/S195809937","display_name":"Ecological Informatics","issn_l":"1574-9541","issn":["1574-9541","1878-0512"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Ecological Informatics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b6c364206b2f4857abe247d369311625","is_oa":true,"landing_page_url":"https://doaj.org/article/b6c364206b2f4857abe247d369311625","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Ecological Informatics, Vol 94, Iss , Pp 103656- (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1016/j.ecoinf.2026.103656","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.ecoinf.2026.103656","pdf_url":null,"source":{"id":"https://openalex.org/S195809937","display_name":"Ecological Informatics","issn_l":"1574-9541","issn":["1574-9541","1878-0512"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Ecological Informatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5632166549","display_name":null,"funder_award_id":"FZT 118","funder_id":"https://openalex.org/F4320330723","funder_display_name":"Deutsches Zentrum f\u00fcr integrative Biodiversit\u00e4tsforschung Halle-Jena-Leipzig"},{"id":"https://openalex.org/G8820888468","display_name":null,"funder_award_id":"09159751","funder_id":"https://openalex.org/F4320330723","funder_display_name":"Deutsches Zentrum f\u00fcr integrative Biodiversit\u00e4tsforschung Halle-Jena-Leipzig"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320330723","display_name":"Deutsches Zentrum f\u00fcr integrative Biodiversit\u00e4tsforschung Halle-Jena-Leipzig","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1755934201","https://openalex.org/W2140623652","https://openalex.org/W2159024099","https://openalex.org/W2608071175","https://openalex.org/W2793108664","https://openalex.org/W2963037989","https://openalex.org/W3109184365","https://openalex.org/W4382202677","https://openalex.org/W4385830672","https://openalex.org/W4387665825","https://openalex.org/W4388489043","https://openalex.org/W4390507226","https://openalex.org/W4400237336","https://openalex.org/W4401428875","https://openalex.org/W4402088577","https://openalex.org/W4404071291","https://openalex.org/W4406179522","https://openalex.org/W4407929305","https://openalex.org/W4408533932","https://openalex.org/W4408920297","https://openalex.org/W4410480075","https://openalex.org/W4410761886","https://openalex.org/W4412934674"],"related_works":[],"abstract_inverted_index":{"Herbaria":[0],"contain":[1],"large":[2,344],"numbers":[3],"of":[4,9,20,30,41,62,105,134,159,171,188,228,246,274,277,288,294],"conserved":[5],"specimens":[6,76,95],"with":[7,47,99],"lots":[8],"information":[10,43,106],"for":[11,97,290,296],"biodiversity":[12],"research,":[13],"since":[14,114],"they":[15,127,143,179],"offer":[16],"a":[17,39,111,225,285,349],"track":[18],"record":[19],"the":[21,35,48,60,64,67,75,94,103,115,169,172,177,185,189,196,234,247,271,275,282,309,322,328,340],"morphology":[22],"as":[23,25,59,320,325,327],"well":[24,326],"temporal":[26],"and":[27,66,80,91,151,153,207,239,261,292,348],"spatial":[28],"distribution":[29],"plant":[31,37],"species":[32,323],"worldwide.":[33],"Besides":[34],"dried":[36],"itself,":[38],"lot":[40],"additional":[42],"is":[44,110,306,353],"usually":[45],"provided":[46],"herbarium":[49,268,273,317],"specimens,":[50],"typically":[51],"captured":[52],"in":[53,131,195,343],"printed":[54,263,297],"or":[55,222],"handwritten":[56,108,260],"labels,":[57,264,319],"such":[58,215],"date":[61],"collection,":[63],"location":[65,170],"collector\u2019s":[68],"name.":[69],"While,":[70],"due":[71],"to":[72,87,124,147,163,181,213,224,315],"historical":[73],"reasons,":[74],"have":[77],"been":[78],"collected":[79],"labeled":[81],"manually,":[82],"considerable":[83,112],"efforts":[84],"are":[85,128,144,331],"underway":[86],"digitize":[88],"entire":[89],"herbaria":[90],"therewith":[92],"make":[93],"available":[96,355],"analysis":[98,187],"automated":[100,186],"methods.":[101],"However,":[102],"extraction":[104],"from":[107,121,270],"labels":[109,173,248],"challenge,":[113],"handwritings":[116],"do":[117],"not":[118,332],"only":[119],"differ":[120],"one":[122,258,262,293],"collector":[123],"another,":[125],"but":[126],"also":[129,192],"often":[130,145],"old":[132,139],"types":[133],"writing":[135],"(e.g.,":[136],"S\u00fctterlin,":[137],"an":[138],"German":[140],"script).":[141],"Therefore,":[142],"hard":[146],"decipher":[148],"both":[149],"manually":[150],"automatically,":[152],"barely":[154],"any":[155],"substantial":[156],"consistent":[157],"data":[158],"this":[160,199],"kind":[161],"exists":[162],"train":[164],"state-of-the-art":[165,204],"vision":[166],"models.":[167],"Since":[168],"differs":[174],"depending":[175],"on":[176,254,267],"record,":[178],"need":[180],"be":[182,237,312],"detected":[183],"before":[184,308],"writing,":[190],"which":[191],"proved":[193],"challenging":[194],"past.":[197],"In":[198,279],"work":[200],"we":[201,231,300],"show":[202,232],"that":[203,233,302],"Large":[205],"Language":[206],"Vision":[208],"Models":[209],"(LLVM)":[210],"possess":[211],"capabilities":[212],"extract":[214],"handwriting":[216],"zero-shot,":[217],"i.e.,":[218],"completely":[219],"without":[220],"training":[221],"fine-tuning,":[223],"high":[226],"degree":[227],"accuracy.":[229],"Additionally,":[230],"results":[235],"can":[236,311,338],"refined":[238],"improved":[240],"considerably":[241],"by":[242],"performing":[243],"zero-shot":[244],"detection":[245],"beforehand.":[249],"We":[250],"evaluate":[251],"our":[252,280],"approach":[253],"two":[255],"novel":[256],"datasets,":[257],"containing":[259],"respectively,":[265],"based":[266],"scans":[269],"virtual":[272],"flora":[276],"Germany.":[278],"evaluations,":[281],"approaches":[283],"achieve":[284],"mean":[286],"similarity":[287],"84.5%":[289],"handwritten,":[291],"93.1%":[295],"labels.":[298],"Thus,":[299],"conclude":[301],"still":[303],"some":[304],"evaluation":[305],"needed":[307],"LLVMs":[310],"fully":[313],"applied":[314],"transcribe":[316],"specimen":[318],"sometimes":[321],"taxonomies":[324],"collection":[329],"sites":[330],"correctly":[333],"identified.":[334],"Still":[335],"these":[336],"models":[337],"support":[339],"transcription":[341],"process":[342],"collections.":[345],"Our":[346],"code":[347],"graphical":[350],"web":[351],"application":[352],"publicly":[354],"under":[356],"https://github.com/Atlas8008/herbarium_label_reader.":[357]},"counts_by_year":[],"updated_date":"2026-02-17T06:05:46.635709","created_date":"2026-02-13T00:00:00"}
