{"id":"https://openalex.org/W4393981110","doi":"https://doi.org/10.1038/s42256-024-00823-9","title":"A 5\u2032 UTR language model for decoding untranslated regions of mRNA and function predictions","display_name":"A 5\u2032 UTR language model for decoding untranslated regions of mRNA and function predictions","publication_year":2024,"publication_date":"2024-04-05","ids":{"openalex":"https://openalex.org/W4393981110","doi":"https://doi.org/10.1038/s42256-024-00823-9","pmid":"https://pubmed.ncbi.nlm.nih.gov/38855263"},"language":"en","primary_location":{"id":"doi:10.1038/s42256-024-00823-9","is_oa":false,"landing_page_url":"https://doi.org/10.1038/s42256-024-00823-9","pdf_url":null,"source":{"id":"https://openalex.org/S2912241403","display_name":"Nature Machine Intelligence","issn_l":"2522-5839","issn":["2522-5839"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319908","host_organization_name":"Nature Portfolio","host_organization_lineage":["https://openalex.org/P4310319908","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Nature Portfolio","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nature Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC11155392/pdf/nihms-1998067.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081142384","display_name":"Yanyi Chu","orcid":"https://orcid.org/0000-0002-4969-3931"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanyi Chu","raw_affiliation_strings":["Center for Statistics and Machine Learning and Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ 08544, USA","Department of Pathology, Stanford University School of Medicine, Stanford, CA 94305, USA","Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Center for Statistics and Machine Learning and Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ 08544, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"Department of Pathology, Stanford University School of Medicine, Stanford, CA 94305, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100580293","display_name":"Dan Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210143085","display_name":"Boston Sports & Shoulder Center","ror":"https://ror.org/045s8h491","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210143085"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dan Yu","raw_affiliation_strings":["RVAC Medicines, Waltham, MA 02451, USA","RVAC Medicines, Waltham, MA, USA"],"affiliations":[{"raw_affiliation_string":"RVAC Medicines, Waltham, MA 02451, USA","institution_ids":["https://openalex.org/I4210143085"]},{"raw_affiliation_string":"RVAC Medicines, Waltham, MA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100512141","display_name":"Yupeng Li","orcid":"https://orcid.org/0009-0000-9052-2408"},"institutions":[{"id":"https://openalex.org/I4210143085","display_name":"Boston Sports & Shoulder Center","ror":"https://ror.org/045s8h491","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210143085"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yupeng Li","raw_affiliation_strings":["RVAC Medicines, Waltham, MA 02451, USA","Zipcode Bio, Weston, MA, USA"],"affiliations":[{"raw_affiliation_string":"RVAC Medicines, Waltham, MA 02451, USA","institution_ids":["https://openalex.org/I4210143085"]},{"raw_affiliation_string":"Zipcode Bio, Weston, MA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109343769","display_name":"Kaixuan Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kaixuan Huang","raw_affiliation_strings":["Center for Statistics and Machine Learning and Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ 08544, USA","Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Center for Statistics and Machine Learning and Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ 08544, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103197320","display_name":"Yue Shen","orcid":"https://orcid.org/0000-0002-4148-6874"},"institutions":[{"id":"https://openalex.org/I4210143085","display_name":"Boston Sports & Shoulder Center","ror":"https://ror.org/045s8h491","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210143085"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yue Shen","raw_affiliation_strings":["RVAC Medicines, Waltham, MA 02451, USA","RVAC Medicines, Waltham, MA, USA"],"affiliations":[{"raw_affiliation_string":"RVAC Medicines, Waltham, MA 02451, USA","institution_ids":["https://openalex.org/I4210143085"]},{"raw_affiliation_string":"RVAC Medicines, Waltham, MA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080765172","display_name":"Le Cong","orcid":"https://orcid.org/0000-0003-4725-8714"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Le Cong","raw_affiliation_strings":["Department of Pathology, Stanford University School of Medicine, Stanford, CA 94305, USA","Department of Pathology, School of Medicine, Stanford University, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Pathology, Stanford University School of Medicine, Stanford, CA 94305, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Department of Pathology, School of Medicine, Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101875766","display_name":"Jason Zhang","orcid":"https://orcid.org/0000-0003-4632-7730"},"institutions":[{"id":"https://openalex.org/I63125664","display_name":"Weston College","ror":"https://ror.org/02reesv50","country_code":"GB","type":"education","lineage":["https://openalex.org/I63125664"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jason Zhang","raw_affiliation_strings":["Zipcode Bio, Weston, MA 02493, USA","Zipcode Bio, Weston, MA, USA"],"affiliations":[{"raw_affiliation_string":"Zipcode Bio, Weston, MA 02493, USA","institution_ids":["https://openalex.org/I63125664"]},{"raw_affiliation_string":"Zipcode Bio, Weston, MA, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100707460","display_name":"Mengdi Wang","orcid":"https://orcid.org/0000-0002-2101-9507"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mengdi Wang","raw_affiliation_strings":["Center for Statistics and Machine Learning and Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ 08544, USA","Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Center for Statistics and Machine Learning and Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ 08544, USA","institution_ids":["https://openalex.org/I20089843"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100707460"],"corresponding_institution_ids":["https://openalex.org/I20089843"],"apc_list":{"value":9750,"currency":"EUR","value_usd":11690},"apc_paid":null,"fwci":24.0422,"has_fulltext":true,"cited_by_count":105,"citation_normalized_percentile":{"value":0.9979626,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"6","issue":"4","first_page":"449","last_page":"460"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10604","display_name":"RNA Research and Splicing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11482","display_name":"RNA modifications and cancer","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/three-prime-untranslated-region","display_name":"Three prime untranslated region","score":0.7014325261116028},{"id":"https://openalex.org/keywords/untranslated-region","display_name":"Untranslated region","score":0.677862286567688},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.6083678007125854},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5842882990837097},{"id":"https://openalex.org/keywords/messenger-rna","display_name":"Messenger RNA","score":0.5734220743179321},{"id":"https://openalex.org/keywords/five-prime-untranslated-region","display_name":"Five prime untranslated region","score":0.4784581661224365},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.358828604221344},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.32525867223739624},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.2866990566253662},{"id":"https://openalex.org/keywords/cell-biology","display_name":"Cell biology","score":0.2204042375087738},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.21567177772521973},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.20162436366081238},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.18357303738594055}],"concepts":[{"id":"https://openalex.org/C22667442","wikidata":"https://www.wikidata.org/wiki/Q3272830","display_name":"Three prime untranslated region","level":5,"score":0.7014325261116028},{"id":"https://openalex.org/C89604277","wikidata":"https://www.wikidata.org/wiki/Q424345","display_name":"Untranslated region","level":4,"score":0.677862286567688},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.6083678007125854},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5842882990837097},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.5734220743179321},{"id":"https://openalex.org/C12464233","wikidata":"https://www.wikidata.org/wiki/Q937624","display_name":"Five prime untranslated region","level":5,"score":0.4784581661224365},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.358828604221344},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.32525867223739624},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.2866990566253662},{"id":"https://openalex.org/C95444343","wikidata":"https://www.wikidata.org/wiki/Q7141","display_name":"Cell biology","level":1,"score":0.2204042375087738},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.21567177772521973},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.20162436366081238},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.18357303738594055}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1038/s42256-024-00823-9","is_oa":false,"landing_page_url":"https://doi.org/10.1038/s42256-024-00823-9","pdf_url":null,"source":{"id":"https://openalex.org/S2912241403","display_name":"Nature Machine Intelligence","issn_l":"2522-5839","issn":["2522-5839"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319908","host_organization_name":"Nature Portfolio","host_organization_lineage":["https://openalex.org/P4310319908","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Nature Portfolio","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nature Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:38855263","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38855263","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nature machine intelligence","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:11155392","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/11155392","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC11155392/pdf/nihms-1998067.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Nat Mach Intell","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:pubmedcentral.nih.gov:11155392","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/11155392","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC11155392/pdf/nihms-1998067.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Nat Mach Intell","raw_type":"Text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G409730928","display_name":null,"funder_award_id":"1953686","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4393981110.pdf"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W1929414144","https://openalex.org/W1983273401","https://openalex.org/W2026487666","https://openalex.org/W2045348184","https://openalex.org/W2062299199","https://openalex.org/W2086561953","https://openalex.org/W2095748631","https://openalex.org/W2152052780","https://openalex.org/W2152974197","https://openalex.org/W2234324103","https://openalex.org/W2417928515","https://openalex.org/W2427010553","https://openalex.org/W2462718056","https://openalex.org/W2597558967","https://openalex.org/W2770378609","https://openalex.org/W2884961061","https://openalex.org/W2955231772","https://openalex.org/W2964113711","https://openalex.org/W2966361671","https://openalex.org/W3032045451","https://openalex.org/W3033368660","https://openalex.org/W3081805696","https://openalex.org/W3087615546","https://openalex.org/W3100348855","https://openalex.org/W3111174583","https://openalex.org/W3152698349","https://openalex.org/W3163562839","https://openalex.org/W3180908419","https://openalex.org/W4200135473","https://openalex.org/W4213095938","https://openalex.org/W4220991830","https://openalex.org/W4225858649","https://openalex.org/W4281867072","https://openalex.org/W4319812018","https://openalex.org/W4384008448","https://openalex.org/W4385445546","https://openalex.org/W4389046989","https://openalex.org/W4393981110","https://openalex.org/W6739901393","https://openalex.org/W6967867575"],"related_works":["https://openalex.org/W2002886563","https://openalex.org/W2074437367","https://openalex.org/W2063674507","https://openalex.org/W977309228","https://openalex.org/W2066198055","https://openalex.org/W2037244830","https://openalex.org/W2386767893","https://openalex.org/W1529829075","https://openalex.org/W2075705389","https://openalex.org/W4230503687"],"abstract_inverted_index":null,"counts_by_year":[{"year":2026,"cited_by_count":18},{"year":2025,"cited_by_count":63},{"year":2024,"cited_by_count":24}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
