{"id":"https://openalex.org/W4391445361","doi":"https://doi.org/10.1186/s12859-024-05666-0","title":"Multi-label classification with XGBoost for metabolic pathway prediction","display_name":"Multi-label classification with XGBoost for metabolic pathway prediction","publication_year":2024,"publication_date":"2024-02-01","ids":{"openalex":"https://openalex.org/W4391445361","doi":"https://doi.org/10.1186/s12859-024-05666-0","pmid":"https://pubmed.ncbi.nlm.nih.gov/38297220"},"language":"en","primary_location":{"id":"doi:10.1186/s12859-024-05666-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-024-05666-0","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/s12859-024-05666-0","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/s12859-024-05666-0","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019407505","display_name":"Hyunwhan Joe","orcid":"https://orcid.org/0000-0001-9637-4573"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Hyunwhan Joe","raw_affiliation_strings":["Biomedical Knowledge Engineering Lab., Seoul National University, Seoul, Republic of Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Biomedical Knowledge Engineering Lab., Seoul National University, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058110900","display_name":"Hong\u2010Gee Kim","orcid":"https://orcid.org/0000-0002-2610-4321"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]},{"id":"https://openalex.org/I4210123907","display_name":"National University College","ror":"https://ror.org/02hs8e066","country_code":"PR","type":"education","lineage":["https://openalex.org/I4210123907"]},{"id":"https://openalex.org/I4210158657","display_name":"Seoul National University Dental Hospital","ror":"https://ror.org/0494zgc81","country_code":"KR","type":"healthcare","lineage":["https://openalex.org/I139264467","https://openalex.org/I4210158657"]}],"countries":["KR","PR"],"is_corresponding":false,"raw_author_name":"Hong-Gee Kim","raw_affiliation_strings":["Biomedical Knowledge Engineering Lab., Seoul National University, Seoul, Republic of Korea. hgkim@snu.ac.kr","School of Dentistry and Dental Research Institute, Seoul National University, Seoul, Republic of Korea. hgkim@snu.ac.kr","Biomedical Knowledge Engineering Lab., Seoul National University, Seoul, Republic of Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Biomedical Knowledge Engineering Lab., Seoul National University, Seoul, Republic of Korea. hgkim@snu.ac.kr","institution_ids":["https://openalex.org/I4210123907","https://openalex.org/I139264467"]},{"raw_affiliation_string":"School of Dentistry and Dental Research Institute, Seoul National University, Seoul, Republic of Korea. hgkim@snu.ac.kr","institution_ids":["https://openalex.org/I4210158657"]},{"raw_affiliation_string":"Biomedical Knowledge Engineering Lab., Seoul National University, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5019407505"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":4.1512,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.94646235,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"25","issue":"1","first_page":"52","last_page":"52"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.7767999768257141,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.7767999768257141,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.0812000036239624,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10932","display_name":"Microbial Metabolic Engineering and Bioproduction","score":0.03150000050663948,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.735169529914856},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.734853208065033},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6946446299552917},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6901213526725769},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.6572359800338745},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.4395330846309662},{"id":"https://openalex.org/keywords/dna-microarray","display_name":"DNA microarray","score":0.4280101954936981},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4160047471523285},{"id":"https://openalex.org/keywords/organism","display_name":"Organism","score":0.4100644588470459},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.17709481716156006},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.12062886357307434},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.0765714943408966}],"concepts":[{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.735169529914856},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.734853208065033},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6946446299552917},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6901213526725769},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.6572359800338745},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.4395330846309662},{"id":"https://openalex.org/C95371953","wikidata":"https://www.wikidata.org/wiki/Q591745","display_name":"DNA microarray","level":4,"score":0.4280101954936981},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4160047471523285},{"id":"https://openalex.org/C137858568","wikidata":"https://www.wikidata.org/wiki/Q7239","display_name":"Organism","level":2,"score":0.4100644588470459},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.17709481716156006},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.12062886357307434},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0765714943408966},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.0}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001695","descriptor_name":"Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001695","descriptor_name":"Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001695","descriptor_name":"Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001695","descriptor_name":"Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016678","descriptor_name":"Genome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016678","descriptor_name":"Genome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016678","descriptor_name":"Genome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016678","descriptor_name":"Genome","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D053858","descriptor_name":"Metabolic Networks and Pathways","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D053858","descriptor_name":"Metabolic Networks and Pathways","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D053858","descriptor_name":"Metabolic Networks and Pathways","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D053858","descriptor_name":"Metabolic Networks and Pathways","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":4,"locations":[{"id":"doi:10.1186/s12859-024-05666-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-024-05666-0","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/s12859-024-05666-0","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:38297220","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38297220","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:10832249","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/10832249","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC10832249/pdf/12859_2024_Article_5666.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics","raw_type":"Text"},{"id":"pmh:oai:doaj.org/article:053bec36905745f6946f4a92c67377b4","is_oa":true,"landing_page_url":"https://doaj.org/article/053bec36905745f6946f4a92c67377b4","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 25, Iss 1, Pp 1-15 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s12859-024-05666-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s12859-024-05666-0","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/s12859-024-05666-0","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2564581808","display_name":null,"funder_award_id":"RS-2023-00268071","funder_id":"https://openalex.org/F4320328359","funder_display_name":"Ministry of Science and ICT, South Korea"},{"id":"https://openalex.org/G6436755233","display_name":null,"funder_award_id":"RS-2023-00268071","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391445361.pdf"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W1678356000","https://openalex.org/W1969675093","https://openalex.org/W1996047071","https://openalex.org/W1997996256","https://openalex.org/W2058501095","https://openalex.org/W2066656905","https://openalex.org/W2077631777","https://openalex.org/W2111470171","https://openalex.org/W2111973517","https://openalex.org/W2134394193","https://openalex.org/W2146241755","https://openalex.org/W2155201905","https://openalex.org/W2160453515","https://openalex.org/W2162473677","https://openalex.org/W2163922914","https://openalex.org/W2295598076","https://openalex.org/W2749464300","https://openalex.org/W2767245172","https://openalex.org/W2773939681","https://openalex.org/W2977870980","https://openalex.org/W2997158276","https://openalex.org/W3043794400","https://openalex.org/W3089740292","https://openalex.org/W3093585277","https://openalex.org/W3169203486","https://openalex.org/W3185730212","https://openalex.org/W3186101535","https://openalex.org/W3216660278","https://openalex.org/W4210531762","https://openalex.org/W4223530030","https://openalex.org/W4283155576","https://openalex.org/W4292168089","https://openalex.org/W4366990373"],"related_works":["https://openalex.org/W24843447","https://openalex.org/W94193318","https://openalex.org/W1547180633","https://openalex.org/W2073808674","https://openalex.org/W2173289516","https://openalex.org/W322176015","https://openalex.org/W20947408","https://openalex.org/W2028140658","https://openalex.org/W2073011570","https://openalex.org/W2468061618"],"abstract_inverted_index":{"BACKGROUND:":[0],"Metabolic":[1],"pathway":[2,33,118,126,198,232],"prediction":[3,34,119,127,199,233],"is":[4,53,59],"one":[5],"possible":[6],"approach":[7],"to":[8,46,84,103,108,170],"address":[9],"the":[10,47,78,123,154,157,168,172,227],"problem":[11],"in":[12,30,44,100,167,206],"system":[13],"biology":[14],"of":[15,156,208,229],"reconstructing":[16],"an":[17],"organism's":[18],"metabolic":[19,117],"network":[20],"from":[21,81,130,222],"its":[22,70],"genome":[23],"sequence.":[24],"Recently":[25],"there":[26],"have":[27],"been":[28],"developments":[29],"machine":[31,39,93,230],"learning-based":[32,40,94,231],"methods":[35,200,234],"that":[36,38,60,86,97,152,160,193,226],"conclude":[37],"approaches":[41,95],"are":[42,164],"similar":[43],"performance":[45,101,228],"most":[48],"used":[49],"method,":[50],"PathoLogic":[51,64,87,202,243],"which":[52,68],"a":[54,115,149],"rule-based":[55],"method.":[56],"One":[57],"issue":[58],"previous":[61,82,92,197],"studies":[62,83],"evaluated":[63],"without":[65,182],"taxonomic":[66,89,204,245],"pruning":[67,90,205],"decreases":[69],"performance.":[71],"RESULTS:":[72],"In":[73],"this":[74,136],"study,":[75],"we":[76,112],"update":[77],"evaluation":[79],"results":[80,191,221],"demonstrate":[85],"with":[88,180,203,244],"outperforms":[91],"and":[96,181,187,212,239],"further":[98],"improvements":[99],"need":[102],"be":[104,109,236],"made":[105],"for":[106],"them":[107],"competitive.":[110],"Furthermore,":[111],"introduce":[113],"mlXGPR,":[114],"XGBoost-based":[116],"method":[120,151],"based":[121],"on":[122,135,185,215],"multi-label":[124,137],"classification":[125],"framework":[128,138],"introduced":[129],"mlLGPR.":[131],"We":[132,147,177],"also":[133],"improve":[134],"by":[139],"utilizing":[140],"correlations":[141,173],"between":[142,174],"labels":[143,175],"using":[144],"classifier":[145,183],"chains.":[146],"propose":[148],"ranking":[150],"determines":[153],"order":[155],"chain":[158,169],"so":[159],"lower":[161],"performing":[162],"classifiers":[163],"placed":[165],"later":[166],"utilize":[171],"more.":[176],"evaluate":[178],"mlXGPR":[179,194],"chains":[184],"single-organism":[186],"multi-organism":[188],"benchmarks.":[189,218],"Our":[190],"indicate":[192,225],"outperform":[195,242],"other":[196],"including":[201],"terms":[207],"hamming":[209],"loss,":[210],"precision":[211],"F1":[213],"score":[214],"single":[216],"organism":[217],"CONCLUSIONS:":[219],"The":[220],"our":[223],"study":[224],"can":[235,240],"substantially":[237],"improved":[238],"even":[241],"pruning.":[246]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":8}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
