{"id":"https://openalex.org/W4415164166","doi":"https://doi.org/10.1109/iccv51701.2025.00803","title":"Taxadiffusion: Progressively Trained Diffusion Model for Fine-Grained Species Generation","display_name":"Taxadiffusion: Progressively Trained Diffusion Model for Fine-Grained Species Generation","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4415164166","doi":"https://doi.org/10.1109/iccv51701.2025.00803"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.00803","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00803","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2506.01923","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083442260","display_name":"Amin Karimi Monsefi","orcid":"https://orcid.org/0000-0002-6101-2828"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amin Karimi Monsefi","raw_affiliation_strings":["The Ohio State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Ohio State University","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059865613","display_name":"Mridul Khurana","orcid":"https://orcid.org/0009-0003-9346-3206"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mridul Khurana","raw_affiliation_strings":["Virginia Tech"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Virginia Tech","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073535794","display_name":"Rajiv Ramnath","orcid":"https://orcid.org/0000-0003-0093-8560"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rajiv Ramnath","raw_affiliation_strings":["The Ohio State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Ohio State University","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081622450","display_name":"Anuj Karpatne","orcid":"https://orcid.org/0000-0003-1647-3534"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anuj Karpatne","raw_affiliation_strings":["Virginia Tech"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Virginia Tech","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101520942","display_name":"Wei\u2010Lun Chao","orcid":"https://orcid.org/0000-0003-1269-7231"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wei-Lun Chao","raw_affiliation_strings":["The Ohio State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Ohio State University","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049674716","display_name":"Cheng Zhang","orcid":"https://orcid.org/0000-0002-8277-5138"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cheng Zhang","raw_affiliation_strings":["Texas A&#x0026;M University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Texas A&#x0026;M University","institution_ids":["https://openalex.org/I91045830"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.20118235,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"8579","last_page":"8589"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12934","display_name":"Plant and fungal interactions","score":0.7768999934196472,"subfield":{"id":"https://openalex.org/subfields/1105","display_name":"Ecology, Evolution, Behavior and Systematics"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12934","display_name":"Plant and fungal interactions","score":0.7768999934196472,"subfield":{"id":"https://openalex.org/subfields/1105","display_name":"Ecology, Evolution, Behavior and Systematics"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/animal-species","display_name":"Animal species","score":0.6122000217437744},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.5878999829292297},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.552299976348877},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.42910000681877136},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.42320001125335693},{"id":"https://openalex.org/keywords/refining","display_name":"Refining (metallurgy)","score":0.41350001096725464},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4090000092983246}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.616100013256073},{"id":"https://openalex.org/C2993056352","wikidata":"https://www.wikidata.org/wiki/Q7432","display_name":"Animal species","level":2,"score":0.6122000217437744},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.5878999829292297},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.552299976348877},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.53329998254776},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4596000015735626},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.42910000681877136},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.42320001125335693},{"id":"https://openalex.org/C60044698","wikidata":"https://www.wikidata.org/wiki/Q1283324","display_name":"Refining (metallurgy)","level":2,"score":0.41350001096725464},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4090000092983246},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.3783000111579895},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37119999527931213},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.365200012922287},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.33880001306533813},{"id":"https://openalex.org/C48702757","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Biological classification","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.29820001125335693},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.29339998960494995},{"id":"https://openalex.org/C189592816","wikidata":"https://www.wikidata.org/wiki/Q427626","display_name":"Taxonomic rank","level":3,"score":0.28940001130104065},{"id":"https://openalex.org/C2988419192","wikidata":"https://www.wikidata.org/wiki/Q7155","display_name":"Animal behavior","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2572999894618988},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.00803","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00803","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2506.01923","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.01923","pdf_url":"https://arxiv.org/pdf/2506.01923","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2506.01923","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2506.01923","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2506.01923","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.01923","pdf_url":"https://arxiv.org/pdf/2506.01923","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7153582637","display_name":null,"funder_award_id":"OAC-2118240","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4415164166.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"propose":[1],"TaxaDiffusion,":[2],"a":[3,117],"taxonomy-informed":[4],"training":[5,126],"framework":[6],"for":[7,113],"diffusion":[8,63],"models":[9,64],"to":[10],"generate":[11],"fine-grained":[12,111,134,146],"animal":[13,135,147],"images":[14],"with":[15,43,103,124],"high":[16],"morphological":[17,98],"and":[18,53,77,82,84],"identity":[19],"accuracy.":[20],"Unlike":[21],"standard":[22],"approaches":[23],"that":[24,36,138],"treat":[25],"each":[26],"species":[27,38,102],"as":[28,75],"an":[29],"independent":[30],"category,":[31],"TaxaDiffusion":[32,59,119],"incorporates":[33],"domain":[34],"knowledge":[35,107],"many":[37],"exhibit":[39],"strong":[40],"visual":[41],"similarities,":[42],"distinctions":[44],"often":[45],"residing":[46],"in":[47,145],"subtle":[48],"variations":[49],"of":[50],"shape,":[51],"pattern,":[52],"color.":[54],"To":[55],"exploit":[56],"these":[57],"relationships,":[58],"progressively":[60],"trains":[61],"conditioned":[62],"across":[65],"different":[66],"taxonomic":[67],"levels":[68],"--":[69],"starting":[70],"from":[71],"broad":[72],"classifications":[73],"such":[74],"Class":[76],"Order,":[78],"refining":[79,110],"through":[80],"Family":[81],"Genus,":[83],"ultimately":[85],"distinguishing":[86],"at":[87],"the":[88],"Species":[89],"level.":[90],"This":[91],"hierarchical":[92],"learning":[93],"strategy":[94],"first":[95],"captures":[96],"coarse-grained":[97],"traits":[99],"shared":[100],"by":[101],"common":[104],"ancestors,":[105],"facilitating":[106],"transfer":[108],"before":[109],"differences":[112],"species-level":[114],"distinction.":[115],"As":[116],"result,":[118],"enables":[120],"accurate":[121],"generation":[122],"even":[123],"limited":[125],"samples":[127],"per":[128],"species.":[129],"Extensive":[130],"experiments":[131],"on":[132],"three":[133],"datasets":[136],"demonstrate":[137],"outperforms":[139],"existing":[140],"approaches,":[141],"achieving":[142],"superior":[143],"fidelity":[144],"image":[148],"generation.":[149],"Project":[150],"page:":[151],"https://amink8.github.io/TaxaDiffusion/":[152]},"counts_by_year":[],"updated_date":"2026-07-03T08:13:44.112507","created_date":"2025-10-14T00:00:00"}
