{"id":"https://openalex.org/W4313527186","doi":"https://doi.org/10.1109/bibm55620.2022.9995393","title":"Molecular Descriptors Property Prediction via a Natural Language Processing Approach","display_name":"Molecular Descriptors Property Prediction via a Natural Language Processing Approach","publication_year":2022,"publication_date":"2022-12-06","ids":{"openalex":"https://openalex.org/W4313527186","doi":"https://doi.org/10.1109/bibm55620.2022.9995393"},"language":"en","primary_location":{"id":"doi:10.1109/bibm55620.2022.9995393","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bibm55620.2022.9995393","pdf_url":null,"source":{"id":"https://openalex.org/S4363607730","display_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102947600","display_name":"Tuan Tran","orcid":"https://orcid.org/0000-0003-2299-0466"},"institutions":[{"id":"https://openalex.org/I392282","display_name":"University at Albany, State University of New York","ror":"https://ror.org/012zs8222","country_code":"US","type":"education","lineage":["https://openalex.org/I392282"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tuan Tran","raw_affiliation_strings":["University at Albany,Department of Computer Science,Albany,New York","Department of Computer Science, University at Albany, Albany, New York"],"affiliations":[{"raw_affiliation_string":"University at Albany,Department of Computer Science,Albany,New York","institution_ids":["https://openalex.org/I392282"]},{"raw_affiliation_string":"Department of Computer Science, University at Albany, Albany, New York","institution_ids":["https://openalex.org/I392282"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017440090","display_name":"Chinwe Ekenna","orcid":"https://orcid.org/0000-0002-7027-6040"},"institutions":[{"id":"https://openalex.org/I392282","display_name":"University at Albany, State University of New York","ror":"https://ror.org/012zs8222","country_code":"US","type":"education","lineage":["https://openalex.org/I392282"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chinwe Ekenna","raw_affiliation_strings":["University at Albany,Department of Computer Science,Albany,New York","Department of Computer Science, University at Albany, Albany, New York"],"affiliations":[{"raw_affiliation_string":"University at Albany,Department of Computer Science,Albany,New York","institution_ids":["https://openalex.org/I392282"]},{"raw_affiliation_string":"Department of Computer Science, University at Albany, Albany, New York","institution_ids":["https://openalex.org/I392282"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5102947600"],"corresponding_institution_ids":["https://openalex.org/I392282"],"apc_list":null,"apc_paid":null,"fwci":0.259,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.44224422,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"30","issue":null,"first_page":"3492","last_page":"3497"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7525411248207092},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6647452116012573},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.6214222311973572},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6020352840423584},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5577732920646667},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.45233747363090515},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.42954036593437195},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4288623631000519},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.1651676595211029}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7525411248207092},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6647452116012573},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.6214222311973572},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6020352840423584},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5577732920646667},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.45233747363090515},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.42954036593437195},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4288623631000519},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.1651676595211029},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm55620.2022.9995393","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bibm55620.2022.9995393","pdf_url":null,"source":{"id":"https://openalex.org/S4363607730","display_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6800000071525574}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1560202902","https://openalex.org/W1930624869","https://openalex.org/W1973698523","https://openalex.org/W1975147762","https://openalex.org/W2138906088","https://openalex.org/W2405035126","https://openalex.org/W2467309505","https://openalex.org/W2594183968","https://openalex.org/W2614053601","https://openalex.org/W2742753960","https://openalex.org/W2749279690","https://openalex.org/W2785720803","https://openalex.org/W2789816271","https://openalex.org/W2885592687","https://openalex.org/W2888164077","https://openalex.org/W2896457183","https://openalex.org/W2899070097","https://openalex.org/W2931367569","https://openalex.org/W2964015378","https://openalex.org/W2965373594","https://openalex.org/W2966357564","https://openalex.org/W2973114758","https://openalex.org/W2979826702","https://openalex.org/W3005552578","https://openalex.org/W3010813949","https://openalex.org/W3032781902","https://openalex.org/W3036931110","https://openalex.org/W3093934881","https://openalex.org/W3105259638","https://openalex.org/W3109892317","https://openalex.org/W3127596955","https://openalex.org/W3128029990","https://openalex.org/W3215781140","https://openalex.org/W4210592951","https://openalex.org/W4297632148","https://openalex.org/W4297733535","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6726873649","https://openalex.org/W6736685754","https://openalex.org/W6739901393","https://openalex.org/W6745537798","https://openalex.org/W6747978776","https://openalex.org/W6755207826","https://openalex.org/W6766673545","https://openalex.org/W6772452955","https://openalex.org/W6784526300","https://openalex.org/W6786619936","https://openalex.org/W6843615466"],"related_works":["https://openalex.org/W2169518243","https://openalex.org/W2582753012","https://openalex.org/W4300101497","https://openalex.org/W2962977872","https://openalex.org/W2379797514","https://openalex.org/W2391763874","https://openalex.org/W2036456628","https://openalex.org/W4226226396","https://openalex.org/W3153750606","https://openalex.org/W4308854837"],"abstract_inverted_index":{"Malaria":[0],"is":[1,64,91],"a":[2,41,77,94,116],"mosquito-borne":[3],"disease":[4],"caused":[5],"by":[6],"single-celled":[7],"blood":[8],"parasites":[9],"of":[10,30,40,44,80],"the":[11,54,59,86,98,123],"genus":[12],"Plasmodium.":[13],"In":[14],"this":[15],"work,":[16],"we":[17,57],"proposed":[18],"semi-supervised":[19],"machine":[20],"learning":[21,72],"models":[22,121],"for":[23,49,71],"predicting":[24],"anti-malaria":[25],"drugs.":[26],"Our":[27,36],"model":[28,37,90,114],"consists":[29],"two-stage":[31],"procedures:":[32],"pre-training":[33,55],"and":[34,46],"finetuning.":[35],"takes":[38],"advantage":[39],"large":[42],"amount":[43],"unlabeled":[45],"label":[47,99],"data":[48],"molecular":[50,81],"properties":[51],"prediction.":[52],"During":[53],"stage,":[56,88],"incorporate":[58],"Masked":[60],"Language":[61],"Model,":[62],"which":[63],"widely":[65],"used":[66],"in":[67,85],"natural":[68],"language":[69],"processing":[70],"text":[73],"representations,":[74],"to":[75,100],"learn":[76],"representational":[78],"topology":[79],"chemical":[82],"space.":[83],"Then":[84],"fine-tuning":[87],"our":[89,113],"trained":[92],"on":[93,122],"smaller":[95],"dataset":[96],"with":[97,119],"perform":[101],"downstream":[102,125],"tasks":[103,126],"such":[104],"as":[105],"classification":[106],"or":[107],"regression.":[108],"Initial":[109],"results":[110],"show":[111],"that":[112],"has":[115],"comparable":[117],"performance":[118],"state-of-the-art":[120],"selected":[124],"from":[127],"MoleculeNet.":[128]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
