{"id":"https://openalex.org/W4409884454","doi":"https://doi.org/10.1186/s13321-025-01008-1","title":"SMILES all around: structure to SMILES conversion for transition metal complexes","display_name":"SMILES all around: structure to SMILES conversion for transition metal complexes","publication_year":2025,"publication_date":"2025-04-28","ids":{"openalex":"https://openalex.org/W4409884454","doi":"https://doi.org/10.1186/s13321-025-01008-1","pmid":"https://pubmed.ncbi.nlm.nih.gov/40296090"},"language":"en","primary_location":{"id":"doi:10.1186/s13321-025-01008-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-025-01008-1","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01008-1","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01008-1","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079016206","display_name":"Maria H. Rasmussen","orcid":null},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Maria H. Rasmussen","raw_affiliation_strings":["Department of Chemistry, University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092254348","display_name":"Magnus Strandgaard","orcid":null},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Magnus Strandgaard","raw_affiliation_strings":["Department of Chemistry, University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051973614","display_name":"Julius Seumer","orcid":"https://orcid.org/0000-0003-2512-3536"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Julius Seumer","raw_affiliation_strings":["Department of Chemistry, University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033340669","display_name":"Lars Hemmingsen","orcid":"https://orcid.org/0000-0002-1823-3035"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Laura K. Hemmingsen","raw_affiliation_strings":["Department of Chemistry, University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002793023","display_name":"Angelo Frei","orcid":"https://orcid.org/0000-0001-6169-2491"},"institutions":[{"id":"https://openalex.org/I52099693","display_name":"University of York","ror":"https://ror.org/04m01e293","country_code":"GB","type":"education","lineage":["https://openalex.org/I52099693"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Angelo Frei","raw_affiliation_strings":["Department of Chemistry, University of York, York, UK"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, University of York, York, UK","institution_ids":["https://openalex.org/I52099693"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044914316","display_name":"David Balcells","orcid":"https://orcid.org/0000-0002-3389-0543"},"institutions":[{"id":"https://openalex.org/I184942183","display_name":"University of Oslo","ror":"https://ror.org/01xtthb56","country_code":"NO","type":"education","lineage":["https://openalex.org/I184942183"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"David Balcells","raw_affiliation_strings":["Department of Chemistry, University of Oslo, Oslo, Norway"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, University of Oslo, Oslo, Norway","institution_ids":["https://openalex.org/I184942183"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053685425","display_name":"Jan H. Jensen","orcid":"https://orcid.org/0000-0002-1465-1010"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Jan H. Jensen","raw_affiliation_strings":["Department of Chemistry, University of Copenhagen, Copenhagen, Denmark. jhjensen@chem.ku.dk"],"affiliations":[{"raw_affiliation_string":"Department of Chemistry, University of Copenhagen, Copenhagen, Denmark. jhjensen@chem.ku.dk","institution_ids":["https://openalex.org/I124055696"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5079016206"],"corresponding_institution_ids":["https://openalex.org/I124055696"],"apc_list":{"value":1290,"currency":"GBP","value_usd":1582},"apc_paid":{"value":1290,"currency":"GBP","value_usd":1582},"fwci":7.4678,"has_fulltext":true,"cited_by_count":16,"citation_normalized_percentile":{"value":0.9790956,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"17","issue":"1","first_page":"63","last_page":"63"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13180","display_name":"Chemistry and Chemical Engineering","score":0.9721999764442444,"subfield":{"id":"https://openalex.org/subfields/2304","display_name":"Environmental Chemistry"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5336597561836243},{"id":"https://openalex.org/keywords/smiles-rearrangement","display_name":"Smiles rearrangement","score":0.45870766043663025},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.42782995104789734},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.33463382720947266},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.29663416743278503},{"id":"https://openalex.org/keywords/stereochemistry","display_name":"Stereochemistry","score":0.10866525769233704}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5336597561836243},{"id":"https://openalex.org/C2779587451","wikidata":"https://www.wikidata.org/wiki/Q898710","display_name":"Smiles rearrangement","level":2,"score":0.45870766043663025},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.42782995104789734},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33463382720947266},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.29663416743278503},{"id":"https://openalex.org/C71240020","wikidata":"https://www.wikidata.org/wiki/Q186011","display_name":"Stereochemistry","level":1,"score":0.10866525769233704}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1186/s13321-025-01008-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-025-01008-1","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01008-1","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},{"id":"pmid:40296090","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40296090","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of cheminformatics","raw_type":null},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/c1a29111-7caf-48bf-9058-c2f08b9bd55c","is_oa":true,"landing_page_url":"https://researchprofiles.ku.dk/da/publications/c1a29111-7caf-48bf-9058-c2f08b9bd55c","pdf_url":"https://curis.ku.dk/ws/files/450048094/s13321-025-01008-1.pdf","source":{"id":"https://openalex.org/S4306401983","display_name":"Research at the University of Copenhagen (University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I124055696","host_organization_name":"University of Copenhagen","host_organization_lineage":["https://openalex.org/I124055696"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Rasmussen , M H , Strandgaard , M , Seumer , J , Hemmingsen , L K , Frei , A , Balcells , D & Jensen , J H 2025 , ' SMILES all around : structure to SMILES conversion for transition metal complexes ' , Journal of Cheminformatics , vol. 17 , no. 1 , 63 . https://doi.org/10.1186/s13321-025-01008-1","raw_type":"article"},{"id":"pmh:oai:doaj.org/article:e5fcb51dc35346d1bf16773fa9c6bcfc","is_oa":true,"landing_page_url":"https://doaj.org/article/e5fcb51dc35346d1bf16773fa9c6bcfc","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Cheminformatics, Vol 17, Iss 1, Pp 1-13 (2025)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:12039060","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/12039060","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Cheminform","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s13321-025-01008-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-025-01008-1","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01008-1","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5687107550","display_name":null,"funder_award_id":"NNF20OC0064104","funder_id":"https://openalex.org/F4320325957","funder_display_name":"Novo Nordisk Fonden"}],"funders":[{"id":"https://openalex.org/F4320320945","display_name":"K\u00f8benhavns Universitet","ror":"https://ror.org/035b05819"},{"id":"https://openalex.org/F4320322436","display_name":"Novo Nordisk","ror":"https://ror.org/0435rc536"},{"id":"https://openalex.org/F4320325957","display_name":"Novo Nordisk Fonden","ror":"https://ror.org/04txyc737"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409884454.pdf","grobid_xml":"https://content.openalex.org/works/W4409884454.grobid-xml"},"referenced_works_count":21,"referenced_works":["https://openalex.org/W1974162115","https://openalex.org/W1981458170","https://openalex.org/W1988037271","https://openalex.org/W2160592148","https://openalex.org/W2169678694","https://openalex.org/W2319902168","https://openalex.org/W2416896172","https://openalex.org/W2912083425","https://openalex.org/W3014154196","https://openalex.org/W3098543521","https://openalex.org/W4293741009","https://openalex.org/W4360780118","https://openalex.org/W4367727879","https://openalex.org/W4383216745","https://openalex.org/W4389340616","https://openalex.org/W4391815300","https://openalex.org/W4391881459","https://openalex.org/W4393309150","https://openalex.org/W4399439682","https://openalex.org/W4403488032","https://openalex.org/W6765940776"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4280602306","https://openalex.org/W2991005846","https://openalex.org/W2949151618","https://openalex.org/W2953164896","https://openalex.org/W2033882320","https://openalex.org/W2140018336","https://openalex.org/W3095763436"],"abstract_inverted_index":{"We":[0,139,163,252,305],"present":[1,237,253],"a":[2,76,149,238,254,275],"method":[3,77,255],"for":[4,8,37,64,148,159,245],"creating":[5],"RDKit-parsable":[6,259],"SMILES":[7,61,69,86,126,147,166,221,244,260,280],"transition":[9,263],"metal":[10,264],"complexes":[11,265],"(TMCs)":[12,266],"based":[13,98,222],"on":[14,99,210,317],"xyz-coordinates":[15],"and":[16,94,155,173,199,270,302],"overall":[17],"charge":[18],"of":[19,145,151,176,185,240,262,277,292],"the":[20,30,35,129,152,177,183,190,211,220,249,318],"complex.":[21],"This":[22,228],"can":[23,224,257,312],"be":[24,180],"viewed":[25],"as":[26,233,300],"an":[27,67],"extension":[28],"to":[29,59,71,167,179,273,286],"program":[31],"xyz2mol":[32],"that":[33,52,208,256,307],"does":[34],"same":[36],"organic":[38],"molecules.":[39],"The":[40,282],"only":[41],"dependency":[42],"is":[43,66],"RDKit,":[44],"which":[45],"makes":[46,229],"it":[47,57,272],"widely":[48],"applicable.":[49],"One":[50],"thing":[51],"has":[53,78],"been":[54],"lacking":[55],"when":[56],"comes":[58],"generating":[60],"from":[62,105,267],"structure":[63],"TMCs":[65,247],"existing":[68],"dataset":[70,239,276],"compare":[72,140],"with.":[73],"Therefore,":[74,82],"sanity-checking":[75],"required":[79],"manual":[80],"work.":[81],"we":[83,206,236],"also":[84],"generate":[85,287],"two":[87],"other":[88],"ways;":[89],"one":[90,124],"where":[91,197],"ligand":[92],"charges":[93],"TMC":[95,279,293],"connectivity":[96],"are":[97,201],"natural":[100],"bond":[101],"orbital":[102],"(NBO)":[103],"analysis":[104],"density":[106],"functional":[107],"theory":[108],"(DFT)":[109],"calculations":[110],"utilizing":[111],"recent":[112],"work":[113],"by":[114,137,193],"Kneiding":[115,194],"et":[116,195],"al.":[117,196],"(Digit":[118],"Discov":[119],"2:":[120],"618-633,":[121],"2023).":[122],"Another":[123],"fixes":[125],"available":[127],"through":[128],"Cambridge":[130],"Structural":[131],"Database":[132],"(CSD),":[133],"making":[134],"them":[135,230],"parsable":[136,243],"RDKit.":[138],"these":[141,165,308],"three":[142,161],"different":[143],"ways":[144],"obtaining":[146],"subset":[150],"CSD":[153],"(tmQMg)":[154],"find":[156,207],">70%":[157],"agreement":[158],"all":[160],"pairs.":[162],"utilize":[164],"make":[168],"simple":[169,310],"molecular":[170,297],"fingerprint":[171],"(FP)":[172],"graph-based":[174],"representations":[175,223,298,311],"molecules":[178],"used":[181],"in":[182,248],"context":[184],"machine":[186,289],"learning.":[187],"Comparing":[188],"with":[189,203],"graphs":[191],"made":[192],"nodes":[198],"edges":[200],"featurized":[202],"DFT":[204],"properties,":[205],"depending":[209,316],"target":[212,319],"property":[213],"(polarizability,":[214],"HOMO-LUMO":[215],"gap":[216],"or":[217],"dipole":[218],"moment)":[219],"perform":[225,288,313],"equally":[226],"well.":[227],"very":[231],"suitable":[232],"baseline-models.":[234],"Finally":[235],"227k":[241,278],"RDKit":[242],"mononuclear":[246],"CSD.Scientific":[250],"contribution":[251],"create":[258,274],"strings":[261],"Cartesian":[268],"coordinates":[269],"use":[271],"strings.":[281],"RDKit-parsability":[283],"allows":[284],"us":[285],"learning":[290],"studies":[291],"properties":[294],"using":[295],"\"standard\"":[296],"such":[299],"fingerprints":[301],"2D-graph":[303],"convolution.":[304],"show":[306],"relatively":[309],"quite":[314],"well":[315],"property.":[320]},"counts_by_year":[{"year":2026,"cited_by_count":8},{"year":2025,"cited_by_count":8}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
