{"id":"https://openalex.org/W4391541076","doi":"https://doi.org/10.1021/acs.jcim.3c01468","title":"Molecular Contrastive Pretraining with Collaborative Featurizations","display_name":"Molecular Contrastive Pretraining with Collaborative Featurizations","publication_year":2024,"publication_date":"2024-02-05","ids":{"openalex":"https://openalex.org/W4391541076","doi":"https://doi.org/10.1021/acs.jcim.3c01468","pmid":"https://pubmed.ncbi.nlm.nih.gov/38315002"},"language":"en","primary_location":{"id":"doi:10.1021/acs.jcim.3c01468","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.3c01468","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015101640","display_name":"Yanqiao Zhu","orcid":"https://orcid.org/0000-0003-2205-5304"},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanqiao Zhu","raw_affiliation_strings":["Department of Computer Science, University of California, Los Angeles, Los Angeles, California 90095, United States"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of California, Los Angeles, Los Angeles, California 90095, United States","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075185753","display_name":"D.-H. Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dingshuo Chen","raw_affiliation_strings":["Center for Research on Intelligent Perception and Computing, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China"],"affiliations":[{"raw_affiliation_string":"Center for Research on Intelligent Perception and Computing, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006709853","display_name":"Yuanqi Du","orcid":"https://orcid.org/0000-0003-2988-0374"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuanqi Du","raw_affiliation_strings":["Department of Computer Science, Cornell University, Ithaca, New York 14853, United States"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Cornell University, Ithaca, New York 14853, United States","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108898964","display_name":"Yingze Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingze Wang","raw_affiliation_strings":["College of Chemistry and Molecular Engineering, Peking University, Beijing 100871, China"],"affiliations":[{"raw_affiliation_string":"College of Chemistry and Molecular Engineering, Peking University, Beijing 100871, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100409503","display_name":"Qiang Liu","orcid":"https://orcid.org/0000-0002-9233-3827"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Liu","raw_affiliation_strings":["Center for Research on Intelligent Perception and Computing, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China"],"affiliations":[{"raw_affiliation_string":"Center for Research on Intelligent Perception and Computing, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047523245","display_name":"Shu Wu","orcid":"https://orcid.org/0000-0003-2164-3577"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shu Wu","raw_affiliation_strings":["Center for Research on Intelligent Perception and Computing, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China"],"affiliations":[{"raw_affiliation_string":"Center for Research on Intelligent Perception and Computing, Institute of Automation, Chinese Academy of Sciences, Beijing 100190, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5047523245"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210112150"],"apc_list":null,"apc_paid":null,"fwci":0.7375,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.69705898,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"64","issue":"4","first_page":"1112","last_page":"1122"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10798","display_name":"Crystallography and molecular interactions","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1606","display_name":"Physical and Theoretical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6227533221244812},{"id":"https://openalex.org/keywords/complement","display_name":"Complement (music)","score":0.598760187625885},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.598615825176239},{"id":"https://openalex.org/keywords/molecular-descriptor","display_name":"Molecular descriptor","score":0.5152214169502258},{"id":"https://openalex.org/keywords/molecular-dynamics","display_name":"Molecular dynamics","score":0.48395875096321106},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.4753248989582062},{"id":"https://openalex.org/keywords/molecular-model","display_name":"Molecular model","score":0.46712714433670044},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46660324931144714},{"id":"https://openalex.org/keywords/drug-discovery","display_name":"Drug discovery","score":0.4433528184890747},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.41651827096939087},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.34245622158050537},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2544700801372528},{"id":"https://openalex.org/keywords/computational-chemistry","display_name":"Computational chemistry","score":0.18317770957946777},{"id":"https://openalex.org/keywords/stereochemistry","display_name":"Stereochemistry","score":0.10431647300720215},{"id":"https://openalex.org/keywords/quantitative-structure\u2013activity-relationship","display_name":"Quantitative structure\u2013activity relationship","score":0.06597515940666199}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6227533221244812},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.598760187625885},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.598615825176239},{"id":"https://openalex.org/C164923092","wikidata":"https://www.wikidata.org/wiki/Q3705921","display_name":"Molecular descriptor","level":3,"score":0.5152214169502258},{"id":"https://openalex.org/C59593255","wikidata":"https://www.wikidata.org/wiki/Q901663","display_name":"Molecular dynamics","level":2,"score":0.48395875096321106},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.4753248989582062},{"id":"https://openalex.org/C178910836","wikidata":"https://www.wikidata.org/wiki/Q2196961","display_name":"Molecular model","level":2,"score":0.46712714433670044},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46660324931144714},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.4433528184890747},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.41651827096939087},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.34245622158050537},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2544700801372528},{"id":"https://openalex.org/C147597530","wikidata":"https://www.wikidata.org/wiki/Q369472","display_name":"Computational chemistry","level":1,"score":0.18317770957946777},{"id":"https://openalex.org/C71240020","wikidata":"https://www.wikidata.org/wiki/Q186011","display_name":"Stereochemistry","level":1,"score":0.10431647300720215},{"id":"https://openalex.org/C164126121","wikidata":"https://www.wikidata.org/wiki/Q766383","display_name":"Quantitative structure\u2013activity relationship","level":2,"score":0.06597515940666199},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C188082640","wikidata":"https://www.wikidata.org/wiki/Q1780899","display_name":"Complementation","level":4,"score":0.0},{"id":"https://openalex.org/C127716648","wikidata":"https://www.wikidata.org/wiki/Q104053","display_name":"Phenotype","level":3,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000080486","descriptor_name":"Computational Chemistry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000080486","descriptor_name":"Computational Chemistry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000080486","descriptor_name":"Computational Chemistry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000080486","descriptor_name":"Computational Chemistry","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D055808","descriptor_name":"Drug Discovery","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1021/acs.jcim.3c01468","is_oa":false,"landing_page_url":"https://doi.org/10.1021/acs.jcim.3c01468","pdf_url":null,"source":{"id":"https://openalex.org/S167262187","display_name":"Journal of Chemical Information and Modeling","issn_l":"1549-9596","issn":["1549-9596","1549-960X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320006","host_organization_name":"American Chemical Society","host_organization_lineage":["https://openalex.org/P4310320006"],"host_organization_lineage_names":["American Chemical Society"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Chemical Information and Modeling","raw_type":"journal-article"},{"id":"pmid:38315002","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38315002","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of chemical information and modeling","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G334303618","display_name":null,"funder_award_id":"62206291","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3666696391","display_name":null,"funder_award_id":"62372454","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4127089600","display_name":null,"funder_award_id":"62141608","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5602928874","display_name":null,"funder_award_id":"2023ZD0120901","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W70551643","https://openalex.org/W146900863","https://openalex.org/W1971460556","https://openalex.org/W1975147762","https://openalex.org/W1988037271","https://openalex.org/W2016979469","https://openalex.org/W2021748110","https://openalex.org/W2043509228","https://openalex.org/W2044834685","https://openalex.org/W2074142600","https://openalex.org/W2080635178","https://openalex.org/W2096541451","https://openalex.org/W2134164499","https://openalex.org/W2169303530","https://openalex.org/W2244785476","https://openalex.org/W2295598076","https://openalex.org/W2541404351","https://openalex.org/W2594183968","https://openalex.org/W2742127985","https://openalex.org/W2911964244","https://openalex.org/W2965373594","https://openalex.org/W2966357564","https://openalex.org/W2972433884","https://openalex.org/W2973114758","https://openalex.org/W3023371261","https://openalex.org/W3034806393","https://openalex.org/W3035524453","https://openalex.org/W3080997787","https://openalex.org/W3093934881","https://openalex.org/W3115755088","https://openalex.org/W3166272013","https://openalex.org/W3173107846","https://openalex.org/W3188589934","https://openalex.org/W4206367183","https://openalex.org/W4213077304","https://openalex.org/W4214868967","https://openalex.org/W4221155201","https://openalex.org/W4226119281","https://openalex.org/W4280491631","https://openalex.org/W4283727985","https://openalex.org/W4286893572","https://openalex.org/W4286907726","https://openalex.org/W4290875097","https://openalex.org/W4290876361","https://openalex.org/W4304697394","https://openalex.org/W4309791143","https://openalex.org/W4313485929","https://openalex.org/W4317757475","https://openalex.org/W4389471260","https://openalex.org/W6929331632"],"related_works":["https://openalex.org/W2047041070","https://openalex.org/W1518653219","https://openalex.org/W1971138788","https://openalex.org/W2072172337","https://openalex.org/W3113041276","https://openalex.org/W2005591679","https://openalex.org/W4390487607","https://openalex.org/W4285304194","https://openalex.org/W2030892568","https://openalex.org/W1974483352"],"abstract_inverted_index":{"Molecular":[0],"pretraining,":[1],"which":[2],"learns":[3],"molecular":[4,34,38,53,61,133],"representations":[5],"over":[6],"massive":[7],"unlabeled":[8],"data,":[9],"has":[10,30],"become":[11],"a":[12,17,95,129],"prominent":[13],"paradigm":[14],"to":[15],"solve":[16],"variety":[18],"of":[19,52,90,132],"tasks":[20],"in":[21,33,60],"computational":[22],"chemistry":[23],"and":[24,46,74,97,115],"drug":[25],"discovery.":[26],"Recently,":[27],"prosperous":[28],"progress":[29],"been":[31],"made":[32],"pretraining":[35,62,100],"with":[36,55,102],"different":[37,81],"featurizations,":[39],"including":[40],"1D":[41],"SMILES":[42],"strings,":[43],"2D":[44],"graphs,":[45],"3D":[47],"geometries.":[48],"However,":[49],"the":[50],"role":[51],"featurizations":[54,104,110,127],"their":[56],"corresponding":[57],"neural":[58],"architectures":[59],"remains":[63],"largely":[64],"unexamined.":[65],"In":[66,88],"this":[67,91],"paper,":[68],"through":[69],"two":[70,126],"case":[71],"studies\u2500chirality":[72],"classification":[73],"aromatic":[75],"ring":[76],"counting\u2500we":[77],"first":[78],"demonstrate":[79],"that":[80,111,120],"featurization":[82],"techniques":[83],"convey":[84],"chemical":[85],"information":[86],"differently.":[87],"light":[89],"observation,":[92],"we":[93],"propose":[94],"simple":[96],"effective":[98],"MOlecular":[99],"framework":[101],"COllaborative":[103],"(MOCO).":[105],"MOCO":[106],"comprehensively":[107],"leverages":[108],"multiple":[109],"complement":[112],"each":[113],"other":[114],"outperforms":[116],"existing":[117],"state-of-the-art":[118],"models":[119],"solely":[121],"rely":[122],"on":[123,128],"one":[124],"or":[125],"wide":[130],"range":[131],"property":[134],"prediction":[135],"tasks.":[136]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
