{"id":"https://openalex.org/W7137882996","doi":"https://doi.org/10.48550/arxiv.2603.15006","title":"Empowering Chemical Structures with Biological Insights for Scalable Phenotypic Virtual Screening","display_name":"Empowering Chemical Structures with Biological Insights for Scalable Phenotypic Virtual Screening","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7137882996","doi":"https://doi.org/10.48550/arxiv.2603.15006"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15006","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15006","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15006","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129729955","display_name":"Xiaoqing Lian","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lian, Xiaoqing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129675397","display_name":"Pengsen Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Pengsen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129732840","display_name":"Tengfeng Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Tengfeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084910255","display_name":"Zhonghao Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Zhonghao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084830664","display_name":"Xibao Cai","orcid":"https://orcid.org/0009-0002-2656-6566"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Xibao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129740493","display_name":"Zhixiang Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Zhixiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034581482","display_name":"Bosheng Song","orcid":"https://orcid.org/0000-0002-1479-5399"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Bosheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129653950","display_name":"He Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, He","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129663448","display_name":"Xiang Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Xiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129689874","display_name":"Yangyang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yangyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129731101","display_name":"Sisi Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Sisi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129703735","display_name":"Chen Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5129729955"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9677000045776367,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9677000045776367,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.02280000038444996,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.0031999999191612005,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7240999937057495},{"id":"https://openalex.org/keywords/biological-data","display_name":"Biological data","score":0.647599995136261},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.620199978351593},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5837000012397766},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5468000173568726},{"id":"https://openalex.org/keywords/in-silico","display_name":"In silico","score":0.491100013256073},{"id":"https://openalex.org/keywords/virtual-screening","display_name":"Virtual screening","score":0.4214000105857849},{"id":"https://openalex.org/keywords/drug-discovery","display_name":"Drug discovery","score":0.40689998865127563},{"id":"https://openalex.org/keywords/biological-network","display_name":"Biological network","score":0.4023999869823456}],"concepts":[{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7240999937057495},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7050999999046326},{"id":"https://openalex.org/C201797286","wikidata":"https://www.wikidata.org/wiki/Q4914986","display_name":"Biological data","level":2,"score":0.647599995136261},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.620199978351593},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5837000012397766},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5468000173568726},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.4950000047683716},{"id":"https://openalex.org/C2775905019","wikidata":"https://www.wikidata.org/wiki/Q192572","display_name":"In silico","level":3,"score":0.491100013256073},{"id":"https://openalex.org/C103697762","wikidata":"https://www.wikidata.org/wiki/Q4112105","display_name":"Virtual screening","level":3,"score":0.4214000105857849},{"id":"https://openalex.org/C74187038","wikidata":"https://www.wikidata.org/wiki/Q1418791","display_name":"Drug discovery","level":2,"score":0.40689998865127563},{"id":"https://openalex.org/C28225019","wikidata":"https://www.wikidata.org/wiki/Q4915005","display_name":"Biological network","level":2,"score":0.4023999869823456},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39989998936653137},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3743000030517578},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3619999885559082},{"id":"https://openalex.org/C2992918937","wikidata":"https://www.wikidata.org/wiki/Q7239","display_name":"Biological organism","level":3,"score":0.34290000796318054},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3370000123977661},{"id":"https://openalex.org/C9927688","wikidata":"https://www.wikidata.org/wiki/Q4915012","display_name":"Biological pathway","level":4,"score":0.3352999985218048},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3208000063896179},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C2777826928","wikidata":"https://www.wikidata.org/wiki/Q3745713","display_name":"Fingerprint (computing)","level":2,"score":0.29089999198913574},{"id":"https://openalex.org/C6555983","wikidata":"https://www.wikidata.org/wiki/Q7181398","display_name":"Phenotypic screening","level":4,"score":0.2741999924182892},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2680000066757202},{"id":"https://openalex.org/C152662350","wikidata":"https://www.wikidata.org/wiki/Q815297","display_name":"Systems biology","level":2,"score":0.265500009059906},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C157044486","wikidata":"https://www.wikidata.org/wiki/Q5754482","display_name":"High-content screening","level":3,"score":0.25589999556541443}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15006","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15006","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15006","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15006","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Motivation:":[0],"The":[1,38,169],"scalable":[2],"identification":[3],"of":[4,71,111,122,173],"bioactive":[5],"compounds":[6],"is":[7,36,41],"essential":[8],"for":[9,159],"contemporary":[10],"drug":[11],"discovery.":[12],"This":[13,64],"process":[14],"faces":[15],"a":[16,74,112,153],"key":[17],"trade-off:":[18],"structural":[19],"screening":[20],"offers":[21],"scalability":[22],"but":[23,35],"lacks":[24],"biological":[25,33,45,59,86,93,114],"context,":[26],"whereas":[27],"high-content":[28],"phenotypic":[29],"profiling":[30],"provides":[31],"deep":[32],"insights":[34],"resource-intensive.":[37],"primary":[39],"challenge":[40],"to":[42,88],"extract":[43],"robust":[44],"signals":[46,105],"from":[47,116],"noisy":[48],"data":[49,60,102],"and":[50,100,119,167,171],"encode":[51],"them":[52],"into":[53],"representations":[54,83],"that":[55,76,128],"do":[56],"not":[57],"require":[58],"at":[61,177],"inference.":[62],"Results:":[63],"study":[65],"presents":[66],"DECODE":[67,95,129,174],"(DEcomposing":[68],"Cellular":[69],"Observations":[70],"Drug":[72],"Effects),":[73],"framework":[75,151],"bridges":[77],"this":[78],"gap":[79],"by":[80],"empowering":[81],"chemical":[82,117,143],"with":[84,137],"intrinsic":[85],"semantics":[87],"enable":[89],"structure-based":[90],"in":[91,134,145,156],"silico":[92],"profiling.":[94],"leverages":[96],"limited":[97],"paired":[98],"transcriptomic":[99],"morphological":[101],"as":[103],"supervisory":[104],"during":[106,163],"training,":[107],"enabling":[108],"the":[109,150],"extraction":[110],"measurement-invariant":[113],"fingerprint":[115],"structures":[118],"explicit":[120],"filtering":[121],"experimental":[123],"noise.":[124],"Our":[125],"evaluations":[126],"demonstrate":[127],"retrieves":[130],"functionally":[131],"similar":[132],"drugs":[133],"zero-shot":[135],"settings":[136],"over":[138,142],"20%":[139],"relative":[140],"improvement":[141],"baselines":[144],"mechanism-of-action":[146],"(MOA)":[147],"prediction.":[148],"Furthermore,":[149],"achieves":[152],"6-fold":[154],"increase":[155],"hit":[157],"rates":[158],"novel":[160],"anti-cancer":[161],"agents":[162],"external":[164],"validation.":[165],"Availability":[166],"implementation:":[168],"codes":[170],"datasets":[172],"are":[175],"available":[176],"https://github.com/lian-xiao/DECODE.":[178]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-18T00:00:00"}
