{"id":"https://openalex.org/W4404521618","doi":"https://doi.org/10.1371/journal.pcbi.1012597","title":"Prediction of virus-host associations using protein language models and multiple instance learning","display_name":"Prediction of virus-host associations using protein language models and multiple instance learning","publication_year":2024,"publication_date":"2024-11-19","ids":{"openalex":"https://openalex.org/W4404521618","doi":"https://doi.org/10.1371/journal.pcbi.1012597","pmid":"https://pubmed.ncbi.nlm.nih.gov/39561204"},"language":"en","primary_location":{"id":"doi:10.1371/journal.pcbi.1012597","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1012597","pdf_url":null,"source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1371/journal.pcbi.1012597","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100326815","display_name":"Dan Liu","orcid":"https://orcid.org/0009-0008-7976-8042"},"institutions":[{"id":"https://openalex.org/I4210146449","display_name":"MRC University of Glasgow Centre for Virus Research","ror":"https://ror.org/03vaer060","country_code":"GB","type":"government","lineage":["https://openalex.org/I4210087105","https://openalex.org/I4210146449","https://openalex.org/I7882870","https://openalex.org/I90344618"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Dan Liu","raw_affiliation_strings":["MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]},{"raw_affiliation_string":"MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057178535","display_name":"Francesca Young","orcid":"https://orcid.org/0000-0002-5236-1145"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]},{"id":"https://openalex.org/I4210146449","display_name":"MRC University of Glasgow Centre for Virus Research","ror":"https://ror.org/03vaer060","country_code":"GB","type":"government","lineage":["https://openalex.org/I4210087105","https://openalex.org/I4210146449","https://openalex.org/I7882870","https://openalex.org/I90344618"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Francesca Young","raw_affiliation_strings":["MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","School of Computing Science, University of Glasgow, Glasgow, United Kingdom","MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]},{"raw_affiliation_string":"School of Computing Science, University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]},{"raw_affiliation_string":"MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071885443","display_name":"Kieran D. Lamb","orcid":"https://orcid.org/0000-0002-3011-5189"},"institutions":[{"id":"https://openalex.org/I4210146449","display_name":"MRC University of Glasgow Centre for Virus Research","ror":"https://ror.org/03vaer060","country_code":"GB","type":"government","lineage":["https://openalex.org/I4210087105","https://openalex.org/I4210146449","https://openalex.org/I7882870","https://openalex.org/I90344618"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Kieran D. Lamb","raw_affiliation_strings":["MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]},{"raw_affiliation_string":"MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082064376","display_name":"David L. Robertson","orcid":"https://orcid.org/0000-0001-6338-0221"},"institutions":[{"id":"https://openalex.org/I4210146449","display_name":"MRC University of Glasgow Centre for Virus Research","ror":"https://ror.org/03vaer060","country_code":"GB","type":"government","lineage":["https://openalex.org/I4210087105","https://openalex.org/I4210146449","https://openalex.org/I7882870","https://openalex.org/I90344618"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"David L. Robertson","raw_affiliation_strings":["MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"MRC-University of Glasgow Centre for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]},{"raw_affiliation_string":"MRC\u2212University of Glasgow Center for Virus Research, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210146449"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018793685","display_name":"Ke Yuan","orcid":"https://orcid.org/0000-0002-2318-1460"},"institutions":[{"id":"https://openalex.org/I2801316944","display_name":"Cancer Research UK","ror":"https://ror.org/054225q67","country_code":"GB","type":"funder","lineage":["https://openalex.org/I2801316944"]},{"id":"https://openalex.org/I4210143228","display_name":"Cancer Research UK Scotland Institute","ror":"https://ror.org/03pv69j64","country_code":"GB","type":"facility","lineage":["https://openalex.org/I2801316944","https://openalex.org/I4210143228"]},{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Ke Yuan","raw_affiliation_strings":["Cancer Research UK Scotland Institute, Glasgow, United Kingdom","School of Cancer Sciences, University of Glasgow, Glasgow, United Kingdom","School of Computing Science, University of Glasgow, Glasgow, United Kingdom","Cancer Research UK Beatson Institute, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Cancer Research UK Scotland Institute, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I2801316944"]},{"raw_affiliation_string":"School of Cancer Sciences, University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]},{"raw_affiliation_string":"School of Computing Science, University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]},{"raw_affiliation_string":"Cancer Research UK Beatson Institute, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I4210143228"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5018793685","https://openalex.org/A5057178535","https://openalex.org/A5071885443","https://openalex.org/A5082064376","https://openalex.org/A5100326815"],"corresponding_institution_ids":["https://openalex.org/I2801316944","https://openalex.org/I4210143228","https://openalex.org/I4210146449","https://openalex.org/I7882870"],"apc_list":{"value":2655,"currency":"USD","value_usd":2655},"apc_paid":{"value":2655,"currency":"USD","value_usd":2655},"fwci":6.4966,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.96872292,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"20","issue":"11","first_page":"e1012597","last_page":"e1012597"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11048","display_name":"Bacteriophages and microbial interactions","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11048","display_name":"Bacteriophages and microbial interactions","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/host","display_name":"Host (biology)","score":0.7595117092132568},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.5893046259880066},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5534140467643738},{"id":"https://openalex.org/keywords/virus","display_name":"Virus","score":0.4271264672279358},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.4146689772605896},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.2831154465675354},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.2597273588180542},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.1983833611011505}],"concepts":[{"id":"https://openalex.org/C126831891","wikidata":"https://www.wikidata.org/wiki/Q221673","display_name":"Host (biology)","level":2,"score":0.7595117092132568},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.5893046259880066},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5534140467643738},{"id":"https://openalex.org/C2522874641","wikidata":"https://www.wikidata.org/wiki/Q808","display_name":"Virus","level":2,"score":0.4271264672279358},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.4146689772605896},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.2831154465675354},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.2597273588180542},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.1983833611011505}],"mesh":[{"descriptor_ui":"D000076662","descriptor_name":"Host Microbial Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D000076662","descriptor_name":"Host Microbial Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D000076662","descriptor_name":"Host Microbial Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D000076662","descriptor_name":"Host Microbial Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D014764","descriptor_name":"Viral Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D014780","descriptor_name":"Viruses","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D014780","descriptor_name":"Viruses","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D014780","descriptor_name":"Viruses","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D014780","descriptor_name":"Viruses","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D054884","descriptor_name":"Host-Pathogen Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D054884","descriptor_name":"Host-Pathogen Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D054884","descriptor_name":"Host-Pathogen Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D054884","descriptor_name":"Host-Pathogen Interactions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true}],"locations_count":5,"locations":[{"id":"doi:10.1371/journal.pcbi.1012597","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1012597","pdf_url":null,"source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},{"id":"pmid:39561204","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/39561204","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS computational biology","raw_type":null},{"id":"pmh:oai:eprints.gla.ac.uk:342709","is_oa":true,"landing_page_url":"http://eprints.gla.ac.uk/view/author/62428.html>,","pdf_url":"https://eprints.gla.ac.uk/342709/1/342709.pdf","source":{"id":"https://openalex.org/S4210235606","display_name":"ENLIGHTEN (Jurnal Bimbingan dan Konseling Islam)","issn_l":"2622-8912","issn":["2622-8912","2622-8920"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"},{"id":"pmh:oai:pubmedcentral.nih.gov:11614202","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/11614202","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC11614202/pdf/pcbi.1012597.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Comput Biol","raw_type":"Text"},{"id":"pmh:oai:doaj.org/article:b6a8b5fcecca4139a96a9a4137909b44","is_oa":true,"landing_page_url":"https://doaj.org/article/b6a8b5fcecca4139a96a9a4137909b44","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, Vol 20, Iss 11, p e1012597 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1371/journal.pcbi.1012597","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1012597","pdf_url":null,"source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Life in Land","id":"https://metadata.un.org/sdg/15","score":0.5600000023841858}],"awards":[{"id":"https://openalex.org/G1586798349","display_name":"Integrative viral genomics and bioinformatics platform","funder_award_id":"MC_UU_00034/5","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G1974542962","display_name":null,"funder_award_id":"Sk\u0142odowska","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G1989121949","display_name":null,"funder_award_id":"EP/R018634/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G1990576317","display_name":null,"funder_award_id":"BBSRC","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G2178131472","display_name":null,"funder_award_id":"955974","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G2206474454","display_name":null,"funder_award_id":"MC_UU_12014","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G2689612763","display_name":null,"funder_award_id":"Marie","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G3340343804","display_name":"Understanding (harmful) virus-host interactions by linking virology and bioinformatics","funder_award_id":"955974","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G3525737904","display_name":"Viral Hepatitis","funder_award_id":"MC_UU_12014/1","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G3817770730","display_name":"DTP Bid Led by University of Edinburgh","funder_award_id":"MR/N013166/1","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G3899947651","display_name":null,"funder_award_id":"BB/V016067/1","funder_id":"https://openalex.org/F4320334629","funder_display_name":"Biotechnology and Biological Sciences Research Council"},{"id":"https://openalex.org/G4447653093","display_name":null,"funder_award_id":"Network","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G4534189432","display_name":null,"funder_award_id":"MR/V01157X/1","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G4716351894","display_name":null,"funder_award_id":"MR/V01157X/2","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G5187265158","display_name":"Closed-Loop Data Science for Complex, Computationally- and Data-Intensive Analytics","funder_award_id":"EP/R018634/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5566807808","display_name":null,"funder_award_id":"MC_UU_","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G6100177302","display_name":null,"funder_award_id":"Sk\u0142odowska","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G6808950318","display_name":null,"funder_award_id":"MR/N013166/1","funder_id":"https://openalex.org/F4320334629","funder_display_name":"Biotechnology and Biological Sciences Research Council"},{"id":"https://openalex.org/G6891376111","display_name":null,"funder_award_id":"MC_UU_12014/12","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G7174427763","display_name":"MOLECULAR BARRIERS TO THE EMERGENCE OF CORONAVIRUSES IN HUMANS","funder_award_id":"MR/V01157X/1","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"},{"id":"https://openalex.org/G7665676760","display_name":"Investigating Host and Viral Factors for Improved Design of Future Live Attenuated Vaccines for IBV","funder_award_id":"BB/V016067/1","funder_id":"https://openalex.org/F4320334629","funder_display_name":"Biotechnology and Biological Sciences Research Council"},{"id":"https://openalex.org/G7901872499","display_name":null,"funder_award_id":"Marie","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G7955706205","display_name":null,"funder_award_id":"Horizon 2020","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8352026019","display_name":null,"funder_award_id":"R018634/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8452545418","display_name":null,"funder_award_id":"unknown","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320332167","display_name":"Directorate for Biological Sciences","ror":"https://ror.org/001xhss06"},{"id":"https://openalex.org/F4320334626","display_name":"Medical Research Council","ror":"https://ror.org/03x94j517"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"},{"id":"https://openalex.org/F4320334629","display_name":"Biotechnology and Biological Sciences Research Council","ror":"https://ror.org/00cwqg982"},{"id":"https://openalex.org/F4320338337","display_name":"H2020 Marie Sk\u0142odowska-Curie Actions","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1448965840","https://openalex.org/W1527927437","https://openalex.org/W1982267716","https://openalex.org/W2047032063","https://openalex.org/W2084241014","https://openalex.org/W2088333086","https://openalex.org/W2101291993","https://openalex.org/W2119859604","https://openalex.org/W2120172561","https://openalex.org/W2154318594","https://openalex.org/W2291003811","https://openalex.org/W2513727910","https://openalex.org/W2559100382","https://openalex.org/W2734399491","https://openalex.org/W2901212243","https://openalex.org/W2904384071","https://openalex.org/W2950954328","https://openalex.org/W3003217347","https://openalex.org/W3011205382","https://openalex.org/W3032757820","https://openalex.org/W3037496568","https://openalex.org/W3092973783","https://openalex.org/W3112043731","https://openalex.org/W3118981004","https://openalex.org/W3146944767","https://openalex.org/W3147885797","https://openalex.org/W4207059657","https://openalex.org/W4231410305","https://openalex.org/W4288431192","https://openalex.org/W4385245566","https://openalex.org/W6683033130","https://openalex.org/W6739901393"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2082860237","https://openalex.org/W2119695867","https://openalex.org/W2130076355","https://openalex.org/W1990804418","https://openalex.org/W1993764875","https://openalex.org/W2046158694","https://openalex.org/W2788277189","https://openalex.org/W2013243191","https://openalex.org/W2977939402"],"abstract_inverted_index":{"Predicting":[0],"virus-host":[1,174],"associations":[2],"is":[3,32],"essential":[4],"to":[5,68,86,155],"determine":[6],"the":[7,25,28,50,166],"specific":[8],"host":[9,26,51,69],"species":[10,52],"that":[11,48,65,93],"viruses":[12,19,31,54],"interact":[13],"with,":[14],"and":[15,22,81,109,125,130,133,150],"discover":[16],"if":[17],"new":[18],"infect":[20],"humans":[21],"animals.":[23],"Currently,":[24],"of":[27,30,122],"majority":[29],"unknown,":[33],"particularly":[34],"in":[35,127,135,165,173],"microbiomes.":[36],"To":[37],"address":[38],"this":[39],"challenge,":[40],"we":[41],"introduce":[42],"EvoMIL,":[43],"a":[44,74],"deep":[45],"learning":[46,85],"method":[47,72],"predicts":[49],"for":[53,146,157],"from":[55,152],"viral":[56,63],"sequences":[57],"only.":[58],"It":[59],"also":[60],"identifies":[61,162],"important":[62,163],"proteins":[64,164],"significantly":[66],"contribute":[67],"prediction.":[70],"The":[71],"combines":[73],"pre-trained":[75],"large":[76],"protein":[77,94],"language":[78],"model":[79],"(ESM)":[80],"attention-based":[82],"multiple":[83],"instance":[84],"allow":[87],"protein-orientated":[88],"predictions.":[89],"Our":[90],"results":[91],"show":[92],"embeddings":[95],"capture":[96],"stronger":[97],"predictive":[98],"signals":[99],"than":[100],"sequence":[101],"composition":[102],"features,":[103],"including":[104],"amino":[105],"acids,":[106],"physiochemical":[107],"properties,":[108],"DNA":[110],"k-mers.":[111],"In":[112],"multi-host":[113],"prediction":[114,167],"tasks,":[115],"EvoMIL":[116,138,161],"achieves":[117],"median":[118],"F1":[119],"score":[120],"improvements":[121],"10.8%,":[123],"16.2%,":[124],"4.9%":[126],"prokaryotic":[128,148],"hosts,":[129],"1.7%,":[131],"6.6%":[132],"11.5%":[134],"eukaryotic":[136,158],"hosts.":[137,159],"binary":[139],"classifiers":[140],"achieve":[141],"impressive":[142],"AUC":[143],"over":[144],"0.95":[145],"all":[147],"hosts":[149],"range":[151],"roughly":[153],"0.8":[154],"0.9":[156],"Furthermore,":[160],"task,":[168],"capturing":[169],"key":[170],"functions":[171],"involved":[172],"specificity.":[175]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2025-10-10T00:00:00"}
