{"id":"https://openalex.org/W7151249528","doi":"https://doi.org/10.1109/icmla66185.2025.00201","title":"Genotype-to-Phenotype Associations in Yeast with Frequented Region Variants and Deep Learning","display_name":"Genotype-to-Phenotype Associations in Yeast with Frequented Region Variants and Deep Learning","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7151249528","doi":"https://doi.org/10.1109/icmla66185.2025.00201"},"language":null,"primary_location":{"id":"doi:10.1109/icmla66185.2025.00201","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00201","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133088005","display_name":"Tejaswi Vemuri","orcid":null},"institutions":[{"id":"https://openalex.org/I11874761","display_name":"University of North Florida","ror":"https://ror.org/01j903a45","country_code":"US","type":"education","lineage":["https://openalex.org/I11874761"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tejaswi Vemuri","raw_affiliation_strings":["University of North Florida,School of Computing,Jacksonville,FL,USA"],"affiliations":[{"raw_affiliation_string":"University of North Florida,School of Computing,Jacksonville,FL,USA","institution_ids":["https://openalex.org/I11874761"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077732895","display_name":"Trung Hoa Dinh","orcid":"https://orcid.org/0000-0001-6303-1427"},"institutions":[{"id":"https://openalex.org/I11874761","display_name":"University of North Florida","ror":"https://ror.org/01j903a45","country_code":"US","type":"education","lineage":["https://openalex.org/I11874761"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Trung Dinh","raw_affiliation_strings":["University of North Florida,School of Computing,Jacksonville,FL,USA"],"affiliations":[{"raw_affiliation_string":"University of North Florida,School of Computing,Jacksonville,FL,USA","institution_ids":["https://openalex.org/I11874761"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133126225","display_name":"Zonglin Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I118353179","display_name":"DePaul University","ror":"https://ror.org/04xtx5t16","country_code":"US","type":"education","lineage":["https://openalex.org/I118353179"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zonglin Yang","raw_affiliation_strings":["DePaul University,School of Computing,Chicago,IL,USA"],"affiliations":[{"raw_affiliation_string":"DePaul University,School of Computing,Chicago,IL,USA","institution_ids":["https://openalex.org/I118353179"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083833340","display_name":"Thiruvarangan Ramaraj","orcid":"https://orcid.org/0000-0002-7333-1041"},"institutions":[{"id":"https://openalex.org/I118353179","display_name":"DePaul University","ror":"https://ror.org/04xtx5t16","country_code":"US","type":"education","lineage":["https://openalex.org/I118353179"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thiruvarangan Ramaraj","raw_affiliation_strings":["DePaul University,School of Computing,Chicago,IL,USA"],"affiliations":[{"raw_affiliation_string":"DePaul University,School of Computing,Chicago,IL,USA","institution_ids":["https://openalex.org/I118353179"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071538924","display_name":"Joann Mudge","orcid":"https://orcid.org/0000-0002-2972-1640"},"institutions":[{"id":"https://openalex.org/I1310183320","display_name":"National Center for Genome Resources","ror":"https://ror.org/01p4cne93","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1310183320"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Joann Mudge","raw_affiliation_strings":["National Center for Genome Resources,Santa Fe,NM,USA"],"affiliations":[{"raw_affiliation_string":"National Center for Genome Resources,Santa Fe,NM,USA","institution_ids":["https://openalex.org/I1310183320"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084888509","display_name":"Brendan Mumey","orcid":"https://orcid.org/0000-0001-7151-2124"},"institutions":[{"id":"https://openalex.org/I23732399","display_name":"Montana State University","ror":"https://ror.org/02w0trx84","country_code":"US","type":"education","lineage":["https://openalex.org/I23732399","https://openalex.org/I4210126032"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brendan Mumey","raw_affiliation_strings":["Montana State University,School of Computer Science,Bozeman,MT,USA"],"affiliations":[{"raw_affiliation_string":"Montana State University,School of Computer Science,Bozeman,MT,USA","institution_ids":["https://openalex.org/I23732399"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010719226","display_name":"Indika Kahanda","orcid":"https://orcid.org/0000-0002-4536-6917"},"institutions":[{"id":"https://openalex.org/I11874761","display_name":"University of North Florida","ror":"https://ror.org/01j903a45","country_code":"US","type":"education","lineage":["https://openalex.org/I11874761"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Indika Kahanda","raw_affiliation_strings":["University of North Florida,School of Computing,Jacksonville,FL,USA"],"affiliations":[{"raw_affiliation_string":"University of North Florida,School of Computing,Jacksonville,FL,USA","institution_ids":["https://openalex.org/I11874761"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5133088005"],"corresponding_institution_ids":["https://openalex.org/I11874761"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.66873061,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1313","last_page":"1317"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.41780000925064087,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.41780000925064087,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11764","display_name":"Evolution and Genetic Dynamics","score":0.09109999984502792,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.04650000110268593,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6065999865531921},{"id":"https://openalex.org/keywords/yeast","display_name":"Yeast","score":0.38929998874664307},{"id":"https://openalex.org/keywords/mutation","display_name":"Mutation","score":0.319599986076355},{"id":"https://openalex.org/keywords/saccharomyces-cerevisiae","display_name":"Saccharomyces cerevisiae","score":0.30959999561309814},{"id":"https://openalex.org/keywords/genetic-variants","display_name":"Genetic variants","score":0.29679998755455017},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.29120001196861267}],"concepts":[{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6065999865531921},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.49880000948905945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45910000801086426},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.40450000762939453},{"id":"https://openalex.org/C2779222958","wikidata":"https://www.wikidata.org/wiki/Q45422","display_name":"Yeast","level":2,"score":0.38929998874664307},{"id":"https://openalex.org/C501734568","wikidata":"https://www.wikidata.org/wiki/Q42918","display_name":"Mutation","level":3,"score":0.319599986076355},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.31790000200271606},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.31220000982284546},{"id":"https://openalex.org/C2777576037","wikidata":"https://www.wikidata.org/wiki/Q719725","display_name":"Saccharomyces cerevisiae","level":3,"score":0.30959999561309814},{"id":"https://openalex.org/C2993967602","wikidata":"https://www.wikidata.org/wiki/Q5532932","display_name":"Genetic variants","level":4,"score":0.29679998755455017},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C189206191","wikidata":"https://www.wikidata.org/wiki/Q222046","display_name":"Genomics","level":4,"score":0.2815000116825104},{"id":"https://openalex.org/C2992884146","wikidata":"https://www.wikidata.org/wiki/Q719725","display_name":"Budding yeast","level":4,"score":0.2775999903678894},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.26930001378059387},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.25679999589920044}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmla66185.2025.00201","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00201","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7762389183044434,"id":"https://metadata.un.org/sdg/2","display_name":"Zero hunger"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1019830208","https://openalex.org/W2046358187","https://openalex.org/W2104093114","https://openalex.org/W2198606573","https://openalex.org/W2336509392","https://openalex.org/W2747043344","https://openalex.org/W2798064943","https://openalex.org/W2952239877","https://openalex.org/W2952366981","https://openalex.org/W2972870121","https://openalex.org/W3127238141","https://openalex.org/W3159728495","https://openalex.org/W3203588026","https://openalex.org/W4255836900","https://openalex.org/W4295087956","https://openalex.org/W4390970542"],"related_works":[],"abstract_inverted_index":{"Phenotypes":[0],"are":[1],"the":[2,96,110,135],"observable":[3],"characteristics":[4],"of":[5,112,129,150],"an":[6],"individual":[7],"organism.":[8],"Predicting":[9],"quantitative":[10],"phenotypes":[11,122,165],"from":[12,40],"genomic":[13],"variation":[14,205],"remains":[15],"challenging":[16],"when":[17,141,203],"causal":[18],"signals":[19],"span":[20],"both":[21],"local":[22],"motifs":[23],"and":[24,84,107,123,160,195],"distal":[25,196],"regulatory":[26,210],"context.":[27,114],"Building":[28],"on":[29,49,57,61,68,75,90,119,127,134],"Frequented":[30],"Regions":[31],"(FRs),":[32],"which":[33],"represent":[34],"subsequences":[35],"conserved":[36],"across":[37],"genomes,":[38],"extracted":[39],"a":[41,78,85],"pangenome":[42],"graph,":[43],"we":[44],"compare":[45],"six":[46],"modeling":[47,149],"strategies":[48],"five":[50,97,121],"yeast":[51],"growth":[52],"phenotypes:":[53],"Random":[54],"Forest":[55],"(RF)":[56],"FR":[58,62,69,76,92],"counts,":[59],"RF":[60,104,125],"sequences,":[63,70,77],"1D":[64],"convolutional":[65],"neural":[66],"networks":[67],"Long":[71],"Short-Term":[72],"Memory":[73],"(LSTM)":[74],"Genome-wide":[79],"Association":[80],"Study":[81],"(GWAS)":[82],"baseline,":[83],"sequence-based":[86,100],"Enformer":[87,115],"model":[88],"trained":[89],"raw":[91,151],"nucleotide":[93],"windows.":[94],"Across":[95],"phenotypes,":[98,187],"all":[99,120],"baselines":[101,171],"improve":[102],"upon":[103],"(FR":[105],"counts)":[106],"GWAS,":[108],"confirming":[109],"value":[111],"sequence":[113,152],"consistently":[116],"outperforms":[117],"CNN/LSTM":[118],"surpasses":[124],"(FR-sequences)":[126],"three":[128],"five,":[130],"while":[131,179],"remaining":[132],"competitive":[133],"others.":[136],"These":[137,175],"results":[138],"indicate":[139],"that":[140,178,191],"long-range":[142],"dependencies":[143],"contribute":[144],"to":[145,208],"trait":[146],"variation,":[147],"transformer-based":[148],"windows":[153],"may":[154,172],"yield":[155,199],"tangible":[156],"gains":[157],"over":[158],"k-mer":[159],"local-pattern":[161],"learners;":[162],"conversely,":[163],"for":[164,185],"dominated":[166],"by":[167],"short-range":[168,180],"signals,":[169],"lightweight":[170],"remain":[173],"competitive.":[174],"findings":[176],"suggest":[177],"motif":[181],"statistics":[182],"can":[183,198],"suffice":[184],"certain":[186],"deep":[188],"learning":[189],"architectures":[190],"integrate":[192],"positional":[193],"context":[194],"interactions":[197],"additional":[200],"gains,":[201],"particularly":[202],"phenotypic":[204],"is":[206],"linked":[207],"dispersed":[209],"signals.":[211]},"counts_by_year":[],"updated_date":"2026-04-09T06:08:40.794217","created_date":"2026-04-08T00:00:00"}
