{"id":"https://openalex.org/W7162109634","doi":"https://doi.org/10.48550/arxiv.2605.21859","title":"PhylaFlow: Hybrid Flow Matching in Billera-Holmes-Vogtmann Tree Space for Phylogenetic Inference","display_name":"PhylaFlow: Hybrid Flow Matching in Billera-Holmes-Vogtmann Tree Space for Phylogenetic Inference","publication_year":2026,"publication_date":"2026-05-21","ids":{"openalex":"https://openalex.org/W7162109634","doi":"https://doi.org/10.48550/arxiv.2605.21859"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.21859","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.21859","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.21859","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006487374","display_name":"Yasha Ektefaie","orcid":"https://orcid.org/0000-0003-2759-4470"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ektefaie, Yasha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136801545","display_name":"Leo Cui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Leo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136807240","display_name":"Shrey Jain","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jain, Shrey","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086052373","display_name":"Marinka \u017ditnik","orcid":"https://orcid.org/0000-0001-8530-7228"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zitnik, Marinka","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136783367","display_name":"Pardis Sabeti","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sabeti, Pardis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.8069999814033508,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.8069999814033508,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11354","display_name":"Evolution and Paleontology Studies","score":0.02759999968111515,"subfield":{"id":"https://openalex.org/subfields/1911","display_name":"Paleontology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12417","display_name":"Morphological variations and asymmetry","score":0.020500000566244125,"subfield":{"id":"https://openalex.org/subfields/2608","display_name":"Geometry and Topology"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/geodesic","display_name":"Geodesic","score":0.6776000261306763},{"id":"https://openalex.org/keywords/orthant","display_name":"Orthant","score":0.6061999797821045},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5978999733924866},{"id":"https://openalex.org/keywords/topology","display_name":"Topology (electrical circuits)","score":0.5914000272750854},{"id":"https://openalex.org/keywords/network-topology","display_name":"Network topology","score":0.5526000261306763},{"id":"https://openalex.org/keywords/phylogenetic-tree","display_name":"Phylogenetic tree","score":0.48829999566078186},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.47099998593330383},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4374000132083893},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.424699991941452}],"concepts":[{"id":"https://openalex.org/C165818556","wikidata":"https://www.wikidata.org/wiki/Q213488","display_name":"Geodesic","level":2,"score":0.6776000261306763},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.6460999846458435},{"id":"https://openalex.org/C2780016784","wikidata":"https://www.wikidata.org/wiki/Q2714507","display_name":"Orthant","level":2,"score":0.6061999797821045},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5978999733924866},{"id":"https://openalex.org/C184720557","wikidata":"https://www.wikidata.org/wiki/Q7825049","display_name":"Topology (electrical circuits)","level":2,"score":0.5914000272750854},{"id":"https://openalex.org/C199845137","wikidata":"https://www.wikidata.org/wiki/Q145490","display_name":"Network topology","level":2,"score":0.5526000261306763},{"id":"https://openalex.org/C193252679","wikidata":"https://www.wikidata.org/wiki/Q242125","display_name":"Phylogenetic tree","level":3,"score":0.48829999566078186},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.47099998593330383},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.45249998569488525},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4374000132083893},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.424699991941452},{"id":"https://openalex.org/C38349280","wikidata":"https://www.wikidata.org/wiki/Q1434290","display_name":"Flow (mathematics)","level":2,"score":0.4018000066280365},{"id":"https://openalex.org/C2776839635","wikidata":"https://www.wikidata.org/wiki/Q14942679","display_name":"Random tree","level":4,"score":0.38940000534057617},{"id":"https://openalex.org/C57830394","wikidata":"https://www.wikidata.org/wiki/Q278079","display_name":"Posterior probability","level":3,"score":0.36890000104904175},{"id":"https://openalex.org/C14166107","wikidata":"https://www.wikidata.org/wiki/Q253829","display_name":"Net (polyhedron)","level":2,"score":0.3569999933242798},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.34869998693466187},{"id":"https://openalex.org/C55919133","wikidata":"https://www.wikidata.org/wiki/Q7644297","display_name":"Supertree","level":4,"score":0.34540000557899475},{"id":"https://openalex.org/C163797641","wikidata":"https://www.wikidata.org/wiki/Q2067937","display_name":"Tree structure","level":3,"score":0.33169999718666077},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3224000036716461},{"id":"https://openalex.org/C47556283","wikidata":"https://www.wikidata.org/wiki/Q1058314","display_name":"Diffeomorphism","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.30239999294281006},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2944999933242798},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28380000591278076},{"id":"https://openalex.org/C70943382","wikidata":"https://www.wikidata.org/wiki/Q505356","display_name":"Antipodal point","level":2,"score":0.2685000002384186},{"id":"https://openalex.org/C186450821","wikidata":"https://www.wikidata.org/wiki/Q17295","display_name":"Euclidean space","level":2,"score":0.25619998574256897},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25600001215934753},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.2551000118255615},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.21859","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.21859","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.21859","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.21859","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Phylogenetic":[0],"trees":[1,71,112],"are":[2],"hybrid":[3,50,200],"objects:":[4],"branch":[5],"lengths":[6],"vary":[7],"continuously,":[8],"while":[9,148],"topologies":[10,116],"change":[11],"discretely":[12],"through":[13],"edge":[14],"contractions":[15],"and":[16,37,86,141,167,211],"expansions.":[17],"Billera-Holmes-Vogtmann":[18],"(BHV)":[19],"tree":[20,59,209],"space":[21,210],"provides":[22],"a":[23,34,49,179,213],"canonical":[24],"geometry":[25,94],"for":[26,217],"this":[27],"structure,":[28],"representing":[29],"each":[30],"resolved":[31],"topology":[32,88,192],"as":[33,40],"Euclidean":[35],"orthant":[36],"topological":[38],"changes":[39],"motion":[41,79],"across":[42],"shared":[43],"lower-dimensional":[44],"boundaries.":[45],"We":[46,90],"introduce":[47],"PhylaFlow,":[48],"flow-matching":[51],"model":[52],"that":[53,199],"learns":[54],"posterior-basin":[55],"transport":[56,206],"in":[57,207],"BHV":[58,65,208],"space.":[60],"PhylaFlow":[61,124,138,158],"is":[62],"trained":[63],"on":[64,145,162,169],"geodesic":[66],"paths":[67],"from":[68],"random":[69],"starting":[70],"to":[72,130],"short-run":[73],"posterior":[74,122,186,191],"samples,":[75],"coupling":[76],"continuous":[77],"branch-length":[78],"within":[80],"orthants":[81],"with":[82],"learned":[83,93],"boundary":[84],"events":[85],"discrete":[87],"transitions.":[89],"evaluate":[91],"the":[92,97,152,174],"operationally:":[95],"if":[96],"flow":[98,201],"reaches":[99],"posterior-relevant":[100],"regions,":[101],"finite-budget":[102,134],"Bayesian":[103,218],"refinement":[104,176],"initialized":[105],"from,":[106],"or":[107],"guided":[108],"by,":[109],"its":[110],"terminal":[111],"should":[113],"recover":[114],"posterior-supported":[115],"more":[117],"efficiently.":[118],"Across":[119],"DS1-DS8":[120],"phylogenetic":[121,219],"benchmarks,":[123],"substantially":[125],"reduces":[126],"initial":[127],"Tree-KL":[128],"relative":[129],"classical":[131],"initializers.":[132],"After":[133],"MrBayes":[135],"refinement,":[136],"direct":[137],"improves":[139],"early":[140],"intermediate":[142],"topology-recovery":[143],"trajectories":[144],"most":[146],"datasets,":[147],"split-guided":[149],"PhylaFlow-MCMC":[150],"obtains":[151],"strongest":[153],"hard-case":[154],"results.":[155],"The":[156],"best":[157],"variant":[159],"outperforms":[160],"short-warmup":[161],"seven":[163],"of":[164,171],"eight":[165,172],"datasets":[166],"PhyloGFN":[168],"five":[170],"under":[173],"same":[175],"budget.":[177],"In":[178],"joint":[180],"sequence-conditioned":[181],"experiment,":[182],"sequence":[183],"embeddings":[184],"steer":[185],"split":[187],"recovery,":[188],"although":[189],"exact":[190],"recovery":[193],"remains":[194],"preliminary.":[195],"These":[196],"results":[197],"show":[198],"matching":[202],"can":[203],"learn":[204],"actionable":[205],"provide":[212],"geometry-aware":[214],"proposal":[215],"mechanism":[216],"inference.":[220]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-23T00:00:00"}
