{"id":"https://openalex.org/W4200319408","doi":"https://doi.org/10.1109/bibe52308.2021.9635320","title":"Preparation of Simplified Molecular Input Line Entry System Notation Datasets for use in Convolutional Neural Networks","display_name":"Preparation of Simplified Molecular Input Line Entry System Notation Datasets for use in Convolutional Neural Networks","publication_year":2021,"publication_date":"2021-10-25","ids":{"openalex":"https://openalex.org/W4200319408","doi":"https://doi.org/10.1109/bibe52308.2021.9635320"},"language":"en","primary_location":{"id":"doi:10.1109/bibe52308.2021.9635320","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibe52308.2021.9635320","pdf_url":null,"source":{"id":"https://openalex.org/S4363608533","display_name":"2021 IEEE 21st International Conference on Bioinformatics and Bioengineering (BIBE)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 21st International Conference on Bioinformatics and Bioengineering (BIBE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054098756","display_name":"Sandi Baressi \u0160egota","orcid":"https://orcid.org/0000-0002-3015-1024"},"institutions":[{"id":"https://openalex.org/I154347574","display_name":"University of Rijeka","ror":"https://ror.org/05r8dqr10","country_code":"HR","type":"education","lineage":["https://openalex.org/I154347574"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Sandi Baressi Segota","raw_affiliation_strings":["Faculty of Engineering, University of Rijeka, Rijeka, Croatia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Rijeka, Rijeka, Croatia","institution_ids":["https://openalex.org/I154347574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070800868","display_name":"Nikola An\u0111eli\u0107","orcid":"https://orcid.org/0000-0002-0314-243X"},"institutions":[{"id":"https://openalex.org/I154347574","display_name":"University of Rijeka","ror":"https://ror.org/05r8dqr10","country_code":"HR","type":"education","lineage":["https://openalex.org/I154347574"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Nikola Andelic","raw_affiliation_strings":["Faculty of Engineering, University of Rijeka, Rijeka, Croatia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Rijeka, Rijeka, Croatia","institution_ids":["https://openalex.org/I154347574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078677385","display_name":"Ivan Lorencin","orcid":"https://orcid.org/0000-0002-5964-245X"},"institutions":[{"id":"https://openalex.org/I154347574","display_name":"University of Rijeka","ror":"https://ror.org/05r8dqr10","country_code":"HR","type":"education","lineage":["https://openalex.org/I154347574"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Ivan Lorencin","raw_affiliation_strings":["Faculty of Engineering, University of Rijeka, Rijeka, Croatia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Rijeka, Rijeka, Croatia","institution_ids":["https://openalex.org/I154347574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079658540","display_name":"Jelena Musulin","orcid":"https://orcid.org/0000-0002-5213-1550"},"institutions":[{"id":"https://openalex.org/I154347574","display_name":"University of Rijeka","ror":"https://ror.org/05r8dqr10","country_code":"HR","type":"education","lineage":["https://openalex.org/I154347574"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Jelena Musulin","raw_affiliation_strings":["Faculty of Engineering, University of Rijeka, Rijeka, Croatia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Rijeka, Rijeka, Croatia","institution_ids":["https://openalex.org/I154347574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055325985","display_name":"Daniel \u0160tifani\u0107","orcid":"https://orcid.org/0000-0001-9396-2441"},"institutions":[{"id":"https://openalex.org/I154347574","display_name":"University of Rijeka","ror":"https://ror.org/05r8dqr10","country_code":"HR","type":"education","lineage":["https://openalex.org/I154347574"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Daniel Stifanic","raw_affiliation_strings":["Faculty of Engineering, University of Rijeka, Rijeka, Croatia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Rijeka, Rijeka, Croatia","institution_ids":["https://openalex.org/I154347574"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005957890","display_name":"Zlatan Car","orcid":"https://orcid.org/0000-0003-2817-9252"},"institutions":[{"id":"https://openalex.org/I154347574","display_name":"University of Rijeka","ror":"https://ror.org/05r8dqr10","country_code":"HR","type":"education","lineage":["https://openalex.org/I154347574"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Zlatan Car","raw_affiliation_strings":["Faculty of Engineering, University of Rijeka, Rijeka, Croatia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Rijeka, Rijeka, Croatia","institution_ids":["https://openalex.org/I154347574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.8343,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.91810842,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10908","display_name":"Analytical Chemistry and Chromatography","score":0.916100025177002,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8332720994949341},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.806161642074585},{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.7524300813674927},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.604091465473175},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6017528772354126},{"id":"https://openalex.org/keywords/line","display_name":"Line (geometry)","score":0.5206167697906494},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5090371966362},{"id":"https://openalex.org/keywords/transformation-matrix","display_name":"Transformation matrix","score":0.4908071458339691},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.47623971104621887},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4685588479042053},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43567946553230286},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4164135158061981},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34132644534111023},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3280409276485443}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8332720994949341},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.806161642074585},{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.7524300813674927},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.604091465473175},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6017528772354126},{"id":"https://openalex.org/C198352243","wikidata":"https://www.wikidata.org/wiki/Q37105","display_name":"Line (geometry)","level":2,"score":0.5206167697906494},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5090371966362},{"id":"https://openalex.org/C165443888","wikidata":"https://www.wikidata.org/wiki/Q1482183","display_name":"Transformation matrix","level":3,"score":0.4908071458339691},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.47623971104621887},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4685588479042053},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43567946553230286},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4164135158061981},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34132644534111023},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3280409276485443},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibe52308.2021.9635320","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibe52308.2021.9635320","pdf_url":null,"source":{"id":"https://openalex.org/S4363608533","display_name":"2021 IEEE 21st International Conference on Bioinformatics and Bioengineering (BIBE)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 21st International Conference on Bioinformatics and Bioengineering (BIBE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1529660283","display_name":null,"funder_award_id":"305.6019-20","funder_id":"https://openalex.org/F4320338335","funder_display_name":"H2020 European Research Council"},{"id":"https://openalex.org/G5293110150","display_name":null,"funder_award_id":"CIII-HR-0108","funder_id":"https://openalex.org/F4320328317","funder_display_name":"CEEPUS"},{"id":"https://openalex.org/G7655492722","display_name":null,"funder_award_id":"KK.01.l.1.01.0009","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"}],"funders":[{"id":"https://openalex.org/F4320328317","display_name":"CEEPUS","ror":null},{"id":"https://openalex.org/F4320335322","display_name":"European Regional Development Fund","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320338335","display_name":"H2020 European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W49913121","https://openalex.org/W1978777023","https://openalex.org/W2102564672","https://openalex.org/W2728215767","https://openalex.org/W2763220183","https://openalex.org/W2985702256","https://openalex.org/W3016131398","https://openalex.org/W3023736619","https://openalex.org/W3028916651","https://openalex.org/W3030738016","https://openalex.org/W3030790048","https://openalex.org/W3033928040","https://openalex.org/W3036016037","https://openalex.org/W3042753240","https://openalex.org/W3048079539","https://openalex.org/W3090209317","https://openalex.org/W3092408118","https://openalex.org/W3093687066","https://openalex.org/W3104850868","https://openalex.org/W3112926604","https://openalex.org/W3118526204","https://openalex.org/W3123999956","https://openalex.org/W3134451384","https://openalex.org/W3138971305","https://openalex.org/W3175014854","https://openalex.org/W3194871141","https://openalex.org/W3205056559","https://openalex.org/W6778332882","https://openalex.org/W6787321127"],"related_works":["https://openalex.org/W2504004674","https://openalex.org/W1595229445","https://openalex.org/W2498744856","https://openalex.org/W4390482104","https://openalex.org/W2100079542","https://openalex.org/W1994539089","https://openalex.org/W1515939773","https://openalex.org/W2112938363","https://openalex.org/W1601028106","https://openalex.org/W2383398300"],"abstract_inverted_index":{"Simplified":[0],"Molecular":[1],"Input":[2],"Line":[3],"Entry":[4],"System":[5],"(SMILES)":[6],"is":[7,54],"a":[8,23,90,123],"type":[9],"of":[10,19,49,77,93,101,113,118],"chemical":[11,20],"notation.":[12],"The":[13,85,126],"SMILES":[14,45,79,95],"format":[15],"allows":[16,31],"the":[17,44,50,55,71,75,78,94,99,102,116,134],"representation":[18],"structures":[21],"in":[22],"shape":[24],"easily":[25],"readable":[26],"by":[27,83,98],"computer":[28],"programs.":[29],"This":[30],"many":[32],"techniques,":[33],"such":[34],"as":[35],"Artificial":[36],"Neural":[37,57],"Networks":[38,58],"(ANNs)":[39],"to":[40,61],"be":[41],"applied":[42],"on":[43,63,122],"formatted":[46],"data.":[47,67],"One":[48],"highest-performing":[51],"ANN":[52],"types":[53],"Convolutional":[56],"(CNNs),":[59],"designed":[60],"work":[62],"images":[64],"or":[65],"matrix-shaped":[66],"In":[68],"this":[69],"paper,":[70],"authors":[72],"will":[73,87],"present":[74],"preparation":[76],"dataset":[80,103],"for":[81],"use":[82],"CNNs.":[84],"paper":[86],"start":[88],"with":[89,110,133],"brief":[91],"description":[92],"format,":[96,109],"followed":[97],"explanation":[100],"transformation":[104,135],"into":[105],"an":[106,111],"NPY":[107],"matrix-based":[108],"example":[112],"utilization":[114],"via":[115],"application":[117],"popular":[119],"CNN":[120],"architectures":[121],"transformed":[124],"dataset.":[125],"proposed":[127],"architecture":[128],"achieves":[129],"satisfactory":[130,140],"results":[131],"(AUC=0.92),":[132],"algorithm":[136],"speed":[137],"also":[138],"proving":[139],"(0.08":[141],"seconds":[142],"per":[143],"data":[144],"point)":[145]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
