{"id":"https://openalex.org/W4416062128","doi":"https://doi.org/10.48550/arxiv.2507.06093","title":"Tile-Based ViT Inference with Visual-Cluster Priors for Zero-Shot Multi-Species Plant Identification","display_name":"Tile-Based ViT Inference with Visual-Cluster Priors for Zero-Shot Multi-Species Plant Identification","publication_year":2025,"publication_date":"2025-07-08","ids":{"openalex":"https://openalex.org/W4416062128","doi":"https://doi.org/10.48550/arxiv.2507.06093"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2507.06093","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.06093","pdf_url":"https://arxiv.org/pdf/2507.06093","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2507.06093","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006723872","display_name":"Murilo Gustineli","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gustineli, Murilo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078321399","display_name":"Anthony Miyaguchi","orcid":"https://orcid.org/0000-0002-9165-8718"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miyaguchi, Anthony","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015773859","display_name":"Adrian Cheung","orcid":"https://orcid.org/0000-0002-4369-2129"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheung, Adrian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5120322676","display_name":"Divyansh Khattak","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khattak, Divyansh","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5006723872"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.871999979019165,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.871999979019165,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10111","display_name":"Remote Sensing in Agriculture","score":0.029400000348687172,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.020600000396370888,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.6233999729156494},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.5242999792098999},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4726000130176544},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.4677000045776367},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4629000127315521},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44339999556541443},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4408999979496002},{"id":"https://openalex.org/keywords/plant-identification","display_name":"Plant identification","score":0.42160001397132874},{"id":"https://openalex.org/keywords/geolocation","display_name":"Geolocation","score":0.41679999232292175}],"concepts":[{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.6233999729156494},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5866000056266785},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5806000232696533},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.5242999792098999},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4726000130176544},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.4677000045776367},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4629000127315521},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44339999556541443},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4408999979496002},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4309999942779541},{"id":"https://openalex.org/C2776091240","wikidata":"https://www.wikidata.org/wiki/Q106238460","display_name":"Plant identification","level":2,"score":0.42160001397132874},{"id":"https://openalex.org/C22041718","wikidata":"https://www.wikidata.org/wiki/Q638949","display_name":"Geolocation","level":2,"score":0.41679999232292175},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36480000615119934},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.36070001125335693},{"id":"https://openalex.org/C166963901","wikidata":"https://www.wikidata.org/wiki/Q287251","display_name":"Kurtosis","level":2,"score":0.3361999988555908},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.3118000030517578},{"id":"https://openalex.org/C205626393","wikidata":"https://www.wikidata.org/wiki/Q2089263","display_name":"Phyllosphere","level":3,"score":0.3109000027179718},{"id":"https://openalex.org/C2781280628","wikidata":"https://www.wikidata.org/wiki/Q5280766","display_name":"Dirichlet process","level":3,"score":0.30550000071525574},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2842999994754791},{"id":"https://openalex.org/C3020402766","wikidata":"https://www.wikidata.org/wiki/Q104376712","display_name":"Prior information","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.274399995803833},{"id":"https://openalex.org/C2984074130","wikidata":"https://www.wikidata.org/wiki/Q73539779","display_name":"R package","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.26420000195503235},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C111350023","wikidata":"https://www.wikidata.org/wiki/Q1191869","display_name":"Markov chain Monte Carlo","level":3,"score":0.26159998774528503},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.250900000333786},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.25060001015663147}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2507.06093","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.06093","pdf_url":"https://arxiv.org/pdf/2507.06093","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2507.06093","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.06093","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2507.06093","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.06093","pdf_url":"https://arxiv.org/pdf/2507.06093","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"describe":[1],"DS@GT's":[2],"second-place":[3],"solution":[4],"to":[5],"the":[6,40],"PlantCLEF":[7],"2025":[8],"challenge":[9],"on":[10],"multi-species":[11],"plant":[12],"identification":[13],"in":[14],"vegetation":[15],"quadrat":[16],"images.":[17],"Our":[18],"pipeline":[19],"combines":[20],"(i)":[21],"a":[22,31,72],"fine-tuned":[23],"Vision":[24],"Transformer":[25],"ViTD2PC24All":[26],"for":[27],"patch-level":[28],"inference,":[29],"(ii)":[30],"4x4":[32],"tiling":[33],"strategy":[34],"that":[35],"aligns":[36],"patch":[37],"size":[38],"with":[39,67],"network's":[41],"518x518":[42],"receptive":[43],"field,":[44],"and":[45,55,65,88],"(iii)":[46],"domain-prior":[47],"adaptation":[48],"through":[49],"PaCMAP":[50],"+":[51],"K-Means":[52],"visual":[53],"clustering":[54],"geolocation":[56],"filtering.":[57],"Tile":[58],"predictions":[59],"are":[60,91],"aggregated":[61],"by":[62],"majority":[63],"vote":[64],"re-weighted":[66],"cluster-specific":[68],"Bayesian":[69],"priors,":[70],"yielding":[71],"macro-averaged":[73],"F1":[74],"of":[75],"0.348":[76],"(private":[77],"leaderboard)":[78],"while":[79],"requiring":[80],"no":[81],"additional":[82],"training.":[83],"All":[84],"code,":[85],"configuration":[86],"files,":[87],"reproducibility":[89],"scripts":[90],"publicly":[92],"available":[93],"at":[94],"https://github.com/dsgt-arc/plantclef-2025.":[95]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
