{"id":"https://openalex.org/W4229049377","doi":"https://doi.org/10.1109/cibcb55180.2022.9863032","title":"Compound Virtual Screening by Learning-to-Rank with Gradient Boosting Decision Tree and Enrichment-based Cumulative Gain","display_name":"Compound Virtual Screening by Learning-to-Rank with Gradient Boosting Decision Tree and Enrichment-based Cumulative Gain","publication_year":2022,"publication_date":"2022-08-15","ids":{"openalex":"https://openalex.org/W4229049377","doi":"https://doi.org/10.1109/cibcb55180.2022.9863032"},"language":"en","primary_location":{"id":"doi:10.1109/cibcb55180.2022.9863032","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cibcb55180.2022.9863032","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Conference on Computational Intelligence in Bioinformatics and Computational Biology (CIBCB)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2205.02169","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005331808","display_name":"Kairi Furui","orcid":"https://orcid.org/0000-0003-1097-0003"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Kairi Furui","raw_affiliation_strings":["School of Computing, Tokyo Institute of Technology,Department of Computer Science,Kanagawa,Japan","Department of Computer Science, School of Computing, Tokyo Institute of Technology, Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"School of Computing, Tokyo Institute of Technology,Department of Computer Science,Kanagawa,Japan","institution_ids":["https://openalex.org/I114531698"]},{"raw_affiliation_string":"Department of Computer Science, School of Computing, Tokyo Institute of Technology, Kanagawa, Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061510293","display_name":"Masahito Ohue","orcid":"https://orcid.org/0000-0002-0120-1643"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masahito Ohue","raw_affiliation_strings":["School of Computing, Tokyo Institute of Technology,Department of Computer Science,Kanagawa,Japan","Department of Computer Science, School of Computing, Tokyo Institute of Technology, Kanagawa, Japan"],"affiliations":[{"raw_affiliation_string":"School of Computing, Tokyo Institute of Technology,Department of Computer Science,Kanagawa,Japan","institution_ids":["https://openalex.org/I114531698"]},{"raw_affiliation_string":"Department of Computer Science, School of Computing, Tokyo Institute of Technology, Kanagawa, Japan","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5005331808"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":1.052,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.7905897,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.9811000227928162,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9028000235557556,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/learning-to-rank","display_name":"Learning to rank","score":0.7388554811477661},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7148403525352478},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.6965664029121399},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6133948564529419},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5835208892822266},{"id":"https://openalex.org/keywords/virtual-screening","display_name":"Virtual screening","score":0.5549050569534302},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5474900603294373},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5388038158416748},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.52914959192276},{"id":"https://openalex.org/keywords/ranking-svm","display_name":"Ranking SVM","score":0.5087190270423889},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.5047577619552612},{"id":"https://openalex.org/keywords/ordinal-regression","display_name":"Ordinal regression","score":0.4435853660106659},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.41380468010902405},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3694179654121399},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20923686027526855},{"id":"https://openalex.org/keywords/pharmacophore","display_name":"Pharmacophore","score":0.1781359314918518},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.15566030144691467},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.1218593418598175}],"concepts":[{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.7388554811477661},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7148403525352478},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.6965664029121399},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6133948564529419},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5835208892822266},{"id":"https://openalex.org/C103697762","wikidata":"https://www.wikidata.org/wiki/Q4112105","display_name":"Virtual screening","level":3,"score":0.5549050569534302},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5474900603294373},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5388038158416748},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.52914959192276},{"id":"https://openalex.org/C124975894","wikidata":"https://www.wikidata.org/wiki/Q7293290","display_name":"Ranking SVM","level":3,"score":0.5087190270423889},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.5047577619552612},{"id":"https://openalex.org/C110313322","wikidata":"https://www.wikidata.org/wiki/Q7100793","display_name":"Ordinal regression","level":2,"score":0.4435853660106659},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.41380468010902405},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3694179654121399},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20923686027526855},{"id":"https://openalex.org/C56173144","wikidata":"https://www.wikidata.org/wiki/Q1539893","display_name":"Pharmacophore","level":2,"score":0.1781359314918518},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.15566030144691467},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.1218593418598175},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cibcb55180.2022.9863032","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cibcb55180.2022.9863032","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE Conference on Computational Intelligence in Bioinformatics and Computational Biology (CIBCB)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2205.02169","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.02169","pdf_url":"https://arxiv.org/pdf/2205.02169","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2205.02169","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.02169","pdf_url":"https://arxiv.org/pdf/2205.02169","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.6200000047683716,"id":"https://metadata.un.org/sdg/3","display_name":"Good health and well-being"}],"awards":[{"id":"https://openalex.org/G6013431047","display_name":null,"funder_award_id":"20H04280","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7732009912","display_name":null,"funder_award_id":"JPMJAX20A3","funder_id":"https://openalex.org/F4320320907","funder_display_name":"Japan Science and Technology Corporation"},{"id":"https://openalex.org/G8317022281","display_name":null,"funder_award_id":"JPMJFR216J","funder_id":"https://openalex.org/F4320334789","funder_display_name":"Japan Science and Technology Agency"}],"funders":[{"id":"https://openalex.org/F4320311405","display_name":"Japan Agency for Medical Research and Development","ror":"https://ror.org/004rtk039"},{"id":"https://openalex.org/F4320320907","display_name":"Japan Science and Technology Corporation","ror":"https://ror.org/00097mb19"},{"id":"https://openalex.org/F4320322704","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960"},{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"},{"id":"https://openalex.org/F4320334789","display_name":"Japan Science and Technology Agency","ror":"https://ror.org/00097mb19"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1521626043","https://openalex.org/W1969231756","https://openalex.org/W1985554184","https://openalex.org/W1988037271","https://openalex.org/W1999798000","https://openalex.org/W2021630848","https://openalex.org/W2069870183","https://openalex.org/W2076412827","https://openalex.org/W2077004593","https://openalex.org/W2081123119","https://openalex.org/W2112937261","https://openalex.org/W2115584760","https://openalex.org/W2116528443","https://openalex.org/W2126255586","https://openalex.org/W2128877075","https://openalex.org/W2143331230","https://openalex.org/W2295598076","https://openalex.org/W2400628046","https://openalex.org/W2605046621","https://openalex.org/W2768348081","https://openalex.org/W2791355014","https://openalex.org/W2898073868","https://openalex.org/W2900090807","https://openalex.org/W2963392959","https://openalex.org/W3014852814","https://openalex.org/W3016398046","https://openalex.org/W3043660595","https://openalex.org/W3159656606","https://openalex.org/W3216888722","https://openalex.org/W4210683988","https://openalex.org/W4241119204","https://openalex.org/W4241676240","https://openalex.org/W4287071232"],"related_works":["https://openalex.org/W85699040","https://openalex.org/W2986119073","https://openalex.org/W3127142483","https://openalex.org/W2128281062","https://openalex.org/W2114531539","https://openalex.org/W3001149962","https://openalex.org/W3089100822","https://openalex.org/W2125398996","https://openalex.org/W2142697503","https://openalex.org/W2963356411"],"abstract_inverted_index":{"Learning-to-rank,":[0],"a":[1,59,124,179,241],"machine":[2],"learning":[3],"technique":[4],"widely":[5,99],"used":[6,58,100,136,148],"in":[7,53,101,137,233],"information":[8,102],"retrieval,":[9,103],"has":[10],"recently":[11],"been":[12,68],"applied":[13],"to":[14,21,190,230],"the":[15,23,74,89,108,138,149,192,200,204,224],"problem":[16],"of":[17,26,50,114,141,194,245],"ligand-based":[18,161],"virtual":[19,162],"screening":[20,55,143,247],"accelerate":[22],"early":[24],"stages":[25],"new":[27,180],"drug":[28],"development.":[29],"Ranking":[30],"prediction":[31,52,125],"models":[32,173],"learn":[33],"based":[34],"on":[35,217],"ordinal":[36],"relationships,":[37],"making":[38],"them":[39],"suitable":[40],"for":[41,160,240],"integrating":[42],"assay":[43],"data":[44],"from":[45],"various":[46],"environments.":[47],"Existing":[48],"studies":[49],"rank":[51],"compound":[54,142,246],"have":[56,66,83],"generally":[57],"learning-to-rank":[60,80,208],"method":[61],"called":[62,92,156],"RankSVM.":[63],"However,":[64],"they":[65],"not":[67],"compared":[69,166],"with":[70,152,167,207],"or":[71],"validated":[72],"against":[73],"gradient":[75],"boosting":[76],"decision":[77],"tree":[78],"(GBDT)-based":[79],"methods":[81,170,212],"that":[82,203,223],"gained":[84],"popularity":[85],"recently.":[86],"Furthermore,":[87],"although":[88],"ranking":[90,153,181,195],"metric":[91],"Normalized":[93,183],"Discounted":[94,185],"Cumulative":[95,186],"Gain":[96,187],"(NDCG)":[97],"is":[98,134],"it":[104],"only":[105],"determines":[106],"whether":[107],"predictions":[109,196,225,232],"are":[110],"better":[111],"than":[112,129],"those":[113],"other":[115,118],"models.":[116],"In":[117,198],"words,":[119],"NDCG":[120,133],"cannot":[121],"recognize":[122],"when":[123],"model":[126,151,206],"produces":[127],"worse":[128],"random":[130,231],"results.":[131],"Nevertheless,":[132],"still":[135],"performance":[139],"evaluation":[140],"using":[144,174,213],"learning-to-rank.":[145],"This":[146],"study":[147],"GBDT":[150,172,205,214],"loss":[154],"functions,":[155],"lambdarank":[157],"and":[158,171,215],"lambdaloss,":[159],"screening;":[163],"results":[164,201],"were":[165,228],"existing":[168,210],"RankSVM":[169,216],"regression.":[175],"We":[176],"also":[177],"proposed":[178],"metric,":[182],"Enrichment":[184],"(NEDCG),":[188],"aiming":[189],"evaluate":[191],"goodness":[193],"properly.":[197],"addition,":[199],"showed":[202,222],"outperformed":[209],"regression":[211,227],"diverse":[218],"datasets.":[219],"Finally,":[220],"NEDCG":[221],"by":[226],"comparable":[229],"multi-assay,":[234],"multi-family":[235],"datasets,":[236],"demonstrating":[237],"its":[238],"usefulness":[239],"more":[242],"direct":[243],"assessment":[244],"performance.":[248]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
