{"id":"https://openalex.org/W4417478313","doi":"https://doi.org/10.1021/acs.jcim.5c02082","title":"BGC-MAC and BGC-MAP: Attention-Based Models for Biosynthetic Gene Cluster Classification and Product Matching","display_name":"BGC-MAC and BGC-MAP: Attention-Based Models for Biosynthetic Gene Cluster Classification and Product Matching","publication_year":2025,"publication_date":"2025-12-18","ids":{"openalex":"https://openalex.org/W4417478313","doi":"https://doi.org/10.1021/acs.jcim.5c02082","pmid":"https://pubmed.ncbi.nlm.nih.gov/41412814"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.5c02082","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c02082","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12744964/","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110936221","display_name":"Kim P. Lu","orcid":"https://orcid.org/0009-0006-5784-1304"},"institutions":[{"id":"https://openalex.org/I166722992","display_name":"University of Massachusetts Chan Medical School","ror":"https://ror.org/0464eyp60","country_code":"US","type":"education","lineage":["https://openalex.org/I166722992"]},{"id":"https://openalex.org/I4210162397","display_name":"UMass Memorial Medical Center","ror":"https://ror.org/053v00853","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1303243448","https://openalex.org/I4210162397"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kechen Lu","raw_affiliation_strings":["Department of Pathology","UMass Chan Medical School"],"raw_orcid":"https://orcid.org/0009-0006-5784-1304","affiliations":[{"raw_affiliation_string":"Department of Pathology","institution_ids":[]},{"raw_affiliation_string":"UMass Chan Medical School","institution_ids":["https://openalex.org/I4210162397","https://openalex.org/I166722992"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Mengting Li","orcid":"https://orcid.org/0009-0004-8597-3350"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]},{"id":"https://openalex.org/I4210137452","display_name":"Drug Discovery Laboratory (Norway)","ror":"https://ror.org/04nybae35","country_code":"NO","type":"company","lineage":["https://openalex.org/I4210137452"]}],"countries":["NO","US"],"is_corresponding":false,"raw_author_name":"Mengting Li","raw_affiliation_strings":["Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","University of Florida"],"raw_orcid":"https://orcid.org/0009-0004-8597-3350","affiliations":[{"raw_affiliation_string":"Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","institution_ids":["https://openalex.org/I4210137452"]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hao Geng","orcid":"https://orcid.org/0009-0009-3349-3191"},"institutions":[{"id":"https://openalex.org/I40347166","display_name":"University of Chicago","ror":"https://ror.org/024mw5h28","country_code":"US","type":"education","lineage":["https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hao Geng","raw_affiliation_strings":["Department of Chemistry","The University of Chicago"],"raw_orcid":"https://orcid.org/0009-0009-3349-3191","affiliations":[{"raw_affiliation_string":"Department of Chemistry","institution_ids":[]},{"raw_affiliation_string":"The University of Chicago","institution_ids":["https://openalex.org/I40347166"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100407913","display_name":"Wenqiang Xu","orcid":"https://orcid.org/0000-0002-8877-0098"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]},{"id":"https://openalex.org/I4210137452","display_name":"Drug Discovery Laboratory (Norway)","ror":"https://ror.org/04nybae35","country_code":"NO","type":"company","lineage":["https://openalex.org/I4210137452"]}],"countries":["NO","US"],"is_corresponding":false,"raw_author_name":"Wenqiang Xu","raw_affiliation_strings":["Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","University of Florida"],"raw_orcid":"https://orcid.org/0000-0002-8877-0098","affiliations":[{"raw_affiliation_string":"Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","institution_ids":["https://openalex.org/I4210137452"]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106290252","display_name":"Manyun Chen","orcid":"https://orcid.org/0000-0001-6803-044X"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]},{"id":"https://openalex.org/I4210137452","display_name":"Drug Discovery Laboratory (Norway)","ror":"https://ror.org/04nybae35","country_code":"NO","type":"company","lineage":["https://openalex.org/I4210137452"]}],"countries":["NO","US"],"is_corresponding":false,"raw_author_name":"Manyun Chen","raw_affiliation_strings":["Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","University of Florida"],"raw_orcid":"https://orcid.org/0000-0001-6803-044X","affiliations":[{"raw_affiliation_string":"Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","institution_ids":["https://openalex.org/I4210137452"]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034040358","display_name":"Tian\u2010Min Fu","orcid":"https://orcid.org/0000-0002-6281-1752"},"institutions":[{"id":"https://openalex.org/I166722992","display_name":"University of Massachusetts Chan Medical School","ror":"https://ror.org/0464eyp60","country_code":"US","type":"education","lineage":["https://openalex.org/I166722992"]},{"id":"https://openalex.org/I4210162397","display_name":"UMass Memorial Medical Center","ror":"https://ror.org/053v00853","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1303243448","https://openalex.org/I4210162397"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tian-Min Fu","raw_affiliation_strings":["Department of Pathology","UMass Chan Medical School"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Pathology","institution_ids":[]},{"raw_affiliation_string":"UMass Chan Medical School","institution_ids":["https://openalex.org/I4210162397","https://openalex.org/I166722992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044244955","display_name":"Hendrik Luesch","orcid":"https://orcid.org/0000-0002-4091-7492"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]},{"id":"https://openalex.org/I4210126319","display_name":"Duke-NUS Medical School","ror":"https://ror.org/02j1m6098","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596","https://openalex.org/I170897317","https://openalex.org/I4210126319"]},{"id":"https://openalex.org/I4210137452","display_name":"Drug Discovery Laboratory (Norway)","ror":"https://ror.org/04nybae35","country_code":"NO","type":"company","lineage":["https://openalex.org/I4210137452"]}],"countries":["NO","SG","US"],"is_corresponding":false,"raw_author_name":"Hendrik Luesch","raw_affiliation_strings":["Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","Duke-NUS Medical School","Program in Cancer and Stem Cell Biology","University of Florida"],"raw_orcid":"https://orcid.org/0000-0002-4091-7492","affiliations":[{"raw_affiliation_string":"Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","institution_ids":["https://openalex.org/I4210137452"]},{"raw_affiliation_string":"Duke-NUS Medical School","institution_ids":["https://openalex.org/I4210126319"]},{"raw_affiliation_string":"Program in Cancer and Stem Cell Biology","institution_ids":[]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040683433","display_name":"Yousong Ding","orcid":"https://orcid.org/0000-0001-8610-0659"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]},{"id":"https://openalex.org/I4210137452","display_name":"Drug Discovery Laboratory (Norway)","ror":"https://ror.org/04nybae35","country_code":"NO","type":"company","lineage":["https://openalex.org/I4210137452"]}],"countries":["NO","US"],"is_corresponding":false,"raw_author_name":"Yousong Ding","raw_affiliation_strings":["Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","University of Florida"],"raw_orcid":"https://orcid.org/0000-0001-8610-0659","affiliations":[{"raw_affiliation_string":"Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","institution_ids":["https://openalex.org/I4210137452"]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040679040","display_name":"Wen Jun Xie","orcid":"https://orcid.org/0000-0002-3982-9305"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]},{"id":"https://openalex.org/I4210137452","display_name":"Drug Discovery Laboratory (Norway)","ror":"https://ror.org/04nybae35","country_code":"NO","type":"company","lineage":["https://openalex.org/I4210137452"]}],"countries":["NO","US"],"is_corresponding":true,"raw_author_name":"Wen Jun Xie","raw_affiliation_strings":["Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","University of Florida"],"raw_orcid":"https://orcid.org/0000-0002-3982-9305","affiliations":[{"raw_affiliation_string":"Department of Medicinal Chemistry, Center for Natural Products, Drug Discovery and Development (CNPD3)","institution_ids":["https://openalex.org/I4210137452"]},{"raw_affiliation_string":"University of Florida","institution_ids":["https://openalex.org/I33213144"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5040679040"],"corresponding_institution_ids":["https://openalex.org/I33213144","https://openalex.org/I4210137452"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.41693226,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"66","issue":"1","first_page":"138","last_page":"151"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10252","display_name":"Microbial Natural Products and Biosynthesis","score":0.5710999965667725,"subfield":{"id":"https://openalex.org/subfields/2736","display_name":"Pharmacology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10252","display_name":"Microbial Natural Products and Biosynthesis","score":0.5710999965667725,"subfield":{"id":"https://openalex.org/subfields/2736","display_name":"Pharmacology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.0843999981880188,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.06400000303983688,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/natural-product","display_name":"Natural product","score":0.7199000120162964},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6869000196456909},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5972999930381775},{"id":"https://openalex.org/keywords/product","display_name":"Product (mathematics)","score":0.44909998774528503},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.43779999017715454},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.3756999969482422},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.37400001287460327}],"concepts":[{"id":"https://openalex.org/C2779396153","wikidata":"https://www.wikidata.org/wiki/Q901227","display_name":"Natural product","level":2,"score":0.7199000120162964},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6869000196456909},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.6089000105857849},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6021999716758728},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5972999930381775},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.44909998774528503},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44620001316070557},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.43779999017715454},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.3756999969482422},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.37400001287460327},{"id":"https://openalex.org/C36857842","wikidata":"https://www.wikidata.org/wiki/Q1501261","display_name":"Gene cluster","level":3,"score":0.3614000082015991},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3452000021934509},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.33149999380111694},{"id":"https://openalex.org/C2908923196","wikidata":"https://www.wikidata.org/wiki/Q5205742","display_name":"Gene Annotation","level":4,"score":0.3255000114440918},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.30140000581741333},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29760000109672546},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25369998812675476}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001688","descriptor_name":"Biological Products","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D001688","descriptor_name":"Biological Products","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D001688","descriptor_name":"Biological Products","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":true},{"descriptor_ui":"D001688","descriptor_name":"Biological Products","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D001688","descriptor_name":"Biological Products","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D001688","descriptor_name":"Biological Products","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":true},{"descriptor_ui":"D005810","descriptor_name":"Multigene Family","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D005810","descriptor_name":"Multigene Family","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D005810","descriptor_name":"Multigene Family","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D053898","descriptor_name":"Biosynthetic Pathways","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D053898","descriptor_name":"Biosynthetic Pathways","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true},{"descriptor_ui":"D053898","descriptor_name":"Biosynthetic Pathways","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1021/acs.jcim.5c02082","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.5c02082","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:41412814","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41412814","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:12744964","is_oa":true,"landing_page_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12744964/","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:pubmedcentral.nih.gov:12744964","is_oa":true,"landing_page_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12744964/","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Chem Inf Model","raw_type":"Text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7700199930","display_name":null,"funder_award_id":"R35GM159995","funder_id":"https://openalex.org/F4320337354","funder_display_name":"National Institute of General Medical Sciences"},{"id":"https://openalex.org/G8498580294","display_name":null,"funder_award_id":"R35GM128742","funder_id":"https://openalex.org/F4320337354","funder_display_name":"National Institute of General Medical Sciences"},{"id":"https://openalex.org/G964658624","display_name":null,"funder_award_id":"RM1GM145426","funder_id":"https://openalex.org/F4320337354","funder_display_name":"National Institute of General Medical Sciences"}],"funders":[{"id":"https://openalex.org/F4320337354","display_name":"National Institute of General Medical Sciences","ror":"https://ror.org/04q48ey07"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1202680985","https://openalex.org/W1971116463","https://openalex.org/W1982793579","https://openalex.org/W1988037271","https://openalex.org/W1992428015","https://openalex.org/W1999668718","https://openalex.org/W2009898018","https://openalex.org/W2057308191","https://openalex.org/W2135967789","https://openalex.org/W2142328147","https://openalex.org/W2231317445","https://openalex.org/W2256742438","https://openalex.org/W2564866890","https://openalex.org/W2902123714","https://openalex.org/W2921485343","https://openalex.org/W2947423323","https://openalex.org/W2961626135","https://openalex.org/W2962897394","https://openalex.org/W2967688728","https://openalex.org/W2994786999","https://openalex.org/W2997918501","https://openalex.org/W3011366455","https://openalex.org/W3048310471","https://openalex.org/W3095583226","https://openalex.org/W3107629351","https://openalex.org/W3118695441","https://openalex.org/W3119952098","https://openalex.org/W3124709617","https://openalex.org/W3159505833","https://openalex.org/W4295312788","https://openalex.org/W4297734170","https://openalex.org/W4327550249","https://openalex.org/W4366352204","https://openalex.org/W4368358469","https://openalex.org/W4377861946","https://openalex.org/W4386607677","https://openalex.org/W4388034592","https://openalex.org/W4388979610","https://openalex.org/W4400010121","https://openalex.org/W4404432370","https://openalex.org/W4405220977","https://openalex.org/W4407108641","https://openalex.org/W4413619957","https://openalex.org/W4414553450"],"related_works":[],"abstract_inverted_index":{"Natural":[0],"products,":[1],"synthesized":[2],"via":[3],"enzymes":[4],"encoded":[5],"by":[6,73],"biosynthetic":[7,149],"gene":[8],"clusters":[9],"(BGCs),":[10],"represent":[11],"a":[12,98,108,139],"major":[13],"source":[14],"of":[15,28,42,155],"therapeutic":[16],"agents.":[17],"Accurate":[18],"BGC":[19,33,64,146],"annotation":[20,34],"is":[21,161],"essential":[22],"to":[23,38,62,93,102],"unlocking":[24],"the":[25,43,112,128,153],"vast":[26],"potential":[27,92,104],"natural":[29,74,99,105,157],"product":[30,60,75,89,100],"diversity.":[31],"However,":[32],"remains":[35],"challenging":[36],"due":[37],"our":[39],"incomplete":[40],"understanding":[41],"enzymatic":[44],"logic":[45],"underlying":[46],"biosynthesis.":[47],"Here,":[48],"we":[49],"present":[50],"two":[51],"deep":[52],"learning":[53],"models":[54],"trained":[55],"on":[56],"experimentally":[57],"validated":[58],"BGC-natural":[59],"pairs":[61],"advance":[63],"annotation.":[65],"The":[66,81,159],"BGC-multihead":[67,82],"attention":[68,83],"classifier":[69],"(BGC-MAC)":[70],"classifies":[71],"BGCs":[72,87,96],"class,":[76],"outperforming":[77],"antiSMASH":[78],"and":[79,123,136,151],"DeepBGC.":[80],"product-matcher":[84],"(BGC-MAP)":[85],"associates":[86],"with":[88],"structures,":[90],"demonstrating":[91],"prioritize":[94],"candidate":[95],"given":[97,109],"or":[101],"identify":[103],"products":[106],"from":[107],"BGC.":[110],"Importantly,":[111],"models'":[113],"cross-attention":[114],"mechanisms":[115],"enable":[116],"explainable":[117,141],"AI,":[118],"identifying":[119],"key":[120],"protein":[121],"domains":[122],"revealing":[124],"BGC-substructure":[125],"relationships":[126],"in":[127],"biosynthesis":[129],"without":[130],"requiring":[131],"prior":[132],"annotations.":[133],"Together,":[134],"BGC-MAC":[135],"BGC-MAP":[137],"establish":[138],"data-driven,":[140],"AI":[142],"framework":[143],"that":[144],"enhances":[145],"annotation,":[147],"deepens":[148],"insight,":[150],"accelerates":[152],"discovery":[154],"new":[156],"products.":[158],"software":[160],"available":[162],"at":[163],"https://github.com/EvoCatalysis/BGC_annotation.":[164]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-19T00:00:00"}
