{"id":"https://openalex.org/W4360615494","doi":"https://doi.org/10.1186/s13321-023-00704-0","title":"GlyLES: Grammar-based Parsing of Glycans from IUPAC-condensed to SMILES","display_name":"GlyLES: Grammar-based Parsing of Glycans from IUPAC-condensed to SMILES","publication_year":2023,"publication_date":"2023-03-23","ids":{"openalex":"https://openalex.org/W4360615494","doi":"https://doi.org/10.1186/s13321-023-00704-0","pmid":"https://pubmed.ncbi.nlm.nih.gov/36959676"},"language":"en","primary_location":{"id":"doi:10.1186/s13321-023-00704-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-023-00704-0","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-023-00704-0","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-023-00704-0","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005749874","display_name":"Roman Joeres","orcid":"https://orcid.org/0009-0000-2952-9395"},"institutions":[{"id":"https://openalex.org/I4210142777","display_name":"Helmholtz Institute for Pharmaceutical Research Saarland","ror":"https://ror.org/042dsac10","country_code":"DE","type":"government","lineage":["https://openalex.org/I1305996414","https://openalex.org/I4210124929","https://openalex.org/I4210142777"]},{"id":"https://openalex.org/I4210124929","display_name":"Helmholtz Centre for Infection Research","ror":"https://ror.org/03d0p2685","country_code":"DE","type":"facility","lineage":["https://openalex.org/I1305996414","https://openalex.org/I4210124929"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Roman Joeres","raw_affiliation_strings":["Center for Bioinformatics, Saarland University, Saarbruecken, Germany. roman.joeres@helmholtz-hips.de","Helmholtz Institute for Pharmaceutical Research Saarland (HIPS), Helmholtz Centre for Infection Research (HZI), Saarbruecken, Germany. roman.joeres@helmholtz-hips.de","Helmholtz Institute for Pharmaceutical Research Saarland (HIPS), Helmholtz Centre for Infection Research (HZI), Saarbruecken, Germany"],"affiliations":[{"raw_affiliation_string":"Center for Bioinformatics, Saarland University, Saarbruecken, Germany. roman.joeres@helmholtz-hips.de","institution_ids":[]},{"raw_affiliation_string":"Helmholtz Institute for Pharmaceutical Research Saarland (HIPS), Helmholtz Centre for Infection Research (HZI), Saarbruecken, Germany. roman.joeres@helmholtz-hips.de","institution_ids":[]},{"raw_affiliation_string":"Helmholtz Institute for Pharmaceutical Research Saarland (HIPS), Helmholtz Centre for Infection Research (HZI), Saarbruecken, Germany","institution_ids":["https://openalex.org/I4210142777","https://openalex.org/I4210124929"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051396144","display_name":"Daniel Bojar","orcid":"https://orcid.org/0000-0002-3008-7851"},"institutions":[{"id":"https://openalex.org/I881427289","display_name":"University of Gothenburg","ror":"https://ror.org/01tm6cn81","country_code":"SE","type":"education","lineage":["https://openalex.org/I881427289"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Daniel Bojar","raw_affiliation_strings":["Department of Chemistry and Molecular Biology, University of Gothenburg, Gothenburg, Sweden","Wallenberg Centre for Molecular and Translational Medicine, University of Gothenburg, Gothenburg, Sweden"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry and Molecular Biology, University of Gothenburg, Gothenburg, Sweden","institution_ids":["https://openalex.org/I881427289"]},{"raw_affiliation_string":"Wallenberg Centre for Molecular and Translational Medicine, University of Gothenburg, Gothenburg, Sweden","institution_ids":["https://openalex.org/I881427289"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101632496","display_name":"Olga V. Kalinina","orcid":"https://orcid.org/0000-0002-9445-477X"},"institutions":[{"id":"https://openalex.org/I91712215","display_name":"Saarland University","ror":"https://ror.org/01jdpyv68","country_code":"DE","type":"education","lineage":["https://openalex.org/I91712215"]},{"id":"https://openalex.org/I4210124929","display_name":"Helmholtz Centre for Infection Research","ror":"https://ror.org/03d0p2685","country_code":"DE","type":"facility","lineage":["https://openalex.org/I1305996414","https://openalex.org/I4210124929"]},{"id":"https://openalex.org/I4210142777","display_name":"Helmholtz Institute for Pharmaceutical Research Saarland","ror":"https://ror.org/042dsac10","country_code":"DE","type":"government","lineage":["https://openalex.org/I1305996414","https://openalex.org/I4210124929","https://openalex.org/I4210142777"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Olga V. Kalinina","raw_affiliation_strings":["Center for Bioinformatics, Saarland University, Saarbruecken, Germany","Faculty of Medicine, Saarland University, Homburg, Germany","Helmholtz Institute for Pharmaceutical Research Saarland (HIPS), Helmholtz Centre for Infection Research (HZI), Saarbruecken, Germany"],"affiliations":[{"raw_affiliation_string":"Center for Bioinformatics, Saarland University, Saarbruecken, Germany","institution_ids":["https://openalex.org/I91712215"]},{"raw_affiliation_string":"Faculty of Medicine, Saarland University, Homburg, Germany","institution_ids":["https://openalex.org/I91712215"]},{"raw_affiliation_string":"Helmholtz Institute for Pharmaceutical Research Saarland (HIPS), Helmholtz Centre for Infection Research (HZI), Saarbruecken, Germany","institution_ids":["https://openalex.org/I4210142777","https://openalex.org/I4210124929"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5005749874"],"corresponding_institution_ids":["https://openalex.org/I4210124929","https://openalex.org/I4210142777"],"apc_list":{"value":1290,"currency":"GBP","value_usd":1582},"apc_paid":{"value":1290,"currency":"GBP","value_usd":1582},"fwci":1.6557,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.83415388,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"15","issue":"1","first_page":"37","last_page":"37"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10602","display_name":"Glycosylation and Glycoproteins Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10602","display_name":"Glycosylation and Glycoproteins Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10835","display_name":"Carbohydrate Chemistry and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1605","display_name":"Organic Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chemical-nomenclature","display_name":"Chemical nomenclature","score":0.9176269173622131},{"id":"https://openalex.org/keywords/glycan","display_name":"Glycan","score":0.6074864864349365},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5288204550743103},{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.5125668048858643},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4921943247318268},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.43486952781677246},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.35656702518463135},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15239760279655457},{"id":"https://openalex.org/keywords/biochemistry","display_name":"Biochemistry","score":0.10438543558120728},{"id":"https://openalex.org/keywords/glycoprotein","display_name":"Glycoprotein","score":0.10297060012817383},{"id":"https://openalex.org/keywords/organic-chemistry","display_name":"Organic chemistry","score":0.09710279107093811}],"concepts":[{"id":"https://openalex.org/C125832229","wikidata":"https://www.wikidata.org/wiki/Q6503924","display_name":"Chemical nomenclature","level":2,"score":0.9176269173622131},{"id":"https://openalex.org/C206212055","wikidata":"https://www.wikidata.org/wiki/Q2553138","display_name":"Glycan","level":3,"score":0.6074864864349365},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5288204550743103},{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.5125668048858643},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4921943247318268},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.43486952781677246},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.35656702518463135},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15239760279655457},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.10438543558120728},{"id":"https://openalex.org/C108625454","wikidata":"https://www.wikidata.org/wiki/Q187126","display_name":"Glycoprotein","level":2,"score":0.10297060012817383},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.09710279107093811},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1186/s13321-023-00704-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-023-00704-0","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-023-00704-0","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},{"id":"pmid:36959676","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/36959676","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of cheminformatics","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:10035253","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/10035253","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC10035253/pdf/13321_2023_Article_704.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Cheminform","raw_type":"Text"},{"id":"pmh:oai:doaj.org/article:be5c3de7146e4616a57edc91a71cd089","is_oa":true,"landing_page_url":"https://doaj.org/article/be5c3de7146e4616a57edc91a71cd089","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Cheminformatics, Vol 15, Iss 1, Pp 1-11 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s13321-023-00704-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-023-00704-0","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-023-00704-0","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6499999761581421,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320923","display_name":"Branco Weiss Fellowship \u2013 Society in Science","ror":"https://ror.org/05a28rw58"},{"id":"https://openalex.org/F4320322327","display_name":"Knut och Alice Wallenbergs Stiftelse","ror":"https://ror.org/004hzzk67"},{"id":"https://openalex.org/F4320323421","display_name":"G\u00f6teborgs Universitet","ror":"https://ror.org/01tm6cn81"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4360615494.pdf"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W145329232","https://openalex.org/W1975147762","https://openalex.org/W2007058937","https://openalex.org/W2034354062","https://openalex.org/W2055498841","https://openalex.org/W2072858400","https://openalex.org/W2077538928","https://openalex.org/W2083174069","https://openalex.org/W2094937489","https://openalex.org/W2121076445","https://openalex.org/W2134950344","https://openalex.org/W2190199302","https://openalex.org/W2237372923","https://openalex.org/W2401162373","https://openalex.org/W2417623909","https://openalex.org/W2591586569","https://openalex.org/W2592378655","https://openalex.org/W2790040331","https://openalex.org/W2802098245","https://openalex.org/W2899070097","https://openalex.org/W2912075946","https://openalex.org/W2942758734","https://openalex.org/W2953110573","https://openalex.org/W2981114078","https://openalex.org/W3036138343","https://openalex.org/W3089517581","https://openalex.org/W3158336232","https://openalex.org/W3174429003","https://openalex.org/W3201853415","https://openalex.org/W3215407107","https://openalex.org/W4220918884","https://openalex.org/W4297837250","https://openalex.org/W4298008375","https://openalex.org/W4382776004"],"related_works":["https://openalex.org/W2095596879","https://openalex.org/W2171646645","https://openalex.org/W4251955477","https://openalex.org/W4386027229","https://openalex.org/W2065541177","https://openalex.org/W2016358259","https://openalex.org/W4212769910","https://openalex.org/W2466842274","https://openalex.org/W4385815001","https://openalex.org/W4256142723"],"abstract_inverted_index":{"Glycans":[0,57,83],"are":[1,8,15,58,96],"important":[2,30],"polysaccharides":[3],"on":[4,73,106,114,191],"cellular":[5],"surfaces":[6],"that":[7,85,219],"bound":[9],"to":[10,90,137,142,167,228],"glycoproteins":[11],"and":[12,37,134,243,245],"glycolipids.":[13],"These":[14,94],"one":[16],"of":[17,23,49,70,156,160,187,207,226],"the":[18,47,62,74,79,91,103,115,139,147,153,170,174,180,184,196,204,211,216,223],"most":[19],"common":[20],"post-translational":[21],"modifications":[22],"proteins":[24],"in":[25,32,42,99,169,210],"eukaryotic":[26],"cells.":[27],"They":[28],"play":[29],"roles":[31],"protein":[33],"folding,":[34],"cell-cell":[35],"interactions,":[36],"other":[38],"extracellular":[39],"processes.":[40],"Changes":[41],"glycan":[43,104,209],"structures":[44,186],"may":[45,232],"influence":[46],"course":[48],"different":[50],"diseases,":[51],"such":[52,119],"as":[53,78,120],"infections":[54],"or":[55],"cancer.":[56],"commonly":[59],"represented":[60],"using":[61],"IUPAC-condensed":[63,65,140,161,175,193,224],"notation.":[64,176,213],"is":[66,129,215,254],"a":[67,107,112,165,208,246],"textual":[68],"representation":[69,113],"glycans":[71,227],"operating":[72],"same":[75],"topological":[76,108],"level":[77],"Symbol":[80],"Nomenclature":[81],"for":[82,111,152,250],"(SNFG)":[84],"assigns":[86],"colored,":[87],"geometrical":[88],"shapes":[89],"main":[92],"monomers.":[93],"symbols":[95],"then":[97],"connected":[98],"tree-like":[100],"structures,":[101],"visualizing":[102],"structure":[105,206],"level.":[109],"Yet":[110],"atomic":[116,185,205],"level,":[117],"notations":[118],"SMILES":[121,157,212,229],"should":[122],"be":[123],"used.":[124],"To":[125],"our":[126],"knowledge,":[127],"there":[128],"no":[130],"easy-to-use,":[131],"general,":[132],"open-source,":[133],"offline":[135],"tool":[136,181],"convert":[138],"notation":[141,225],"SMILES.":[143],"Here,":[144],"we":[145],"present":[146],"open-access":[148],"Python":[149],"package":[150,218],"GlyLES":[151,163,214,253],"generalizable":[154],"generation":[155],"representations":[158],"out":[159],"representations.":[162],"uses":[164],"grammar":[166],"read":[168],"monomer":[171,189],"tree":[172],"from":[173,222],"From":[177],"this":[178],"tree,":[179],"can":[182],"compute":[183],"each":[188],"based":[190],"their":[192],"descriptions.":[194],"In":[195],"last":[197],"step,":[198],"it":[199],"merges":[200],"all":[201],"monomers":[202],"into":[203],"first":[217],"allows":[220],"conversion":[221],"strings.":[230],"This":[231],"have":[233],"multiple":[234],"applications,":[235],"including":[236],"straightforward":[237],"visualization,":[238],"substructure":[239],"search,":[240],"molecular":[241],"modeling":[242],"docking,":[244],"new":[247],"featurization":[248],"strategy":[249],"machine-learning":[251],"algorithms.":[252],"available":[255],"at":[256],"https://github.com/kalininalab/GlyLES":[257],".":[258]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
