{"id":"https://openalex.org/W7126046958","doi":"https://doi.org/10.1109/bibm66473.2025.11356101","title":"Minimal Features Subset Enabling Essential Gene Prediction Within and Between Organisms for Sulfate Reducing Bacteria Family","display_name":"Minimal Features Subset Enabling Essential Gene Prediction Within and Between Organisms for Sulfate Reducing Bacteria Family","publication_year":2025,"publication_date":"2025-12-15","ids":{"openalex":"https://openalex.org/W7126046958","doi":"https://doi.org/10.1109/bibm66473.2025.11356101"},"language":null,"primary_location":{"id":"doi:10.1109/bibm66473.2025.11356101","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356101","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124172818","display_name":"Alain Bertrand Bomgni","orcid":null},"institutions":[{"id":"https://openalex.org/I126547033","display_name":"Oglala Lakota College","ror":"https://ror.org/012y1mj37","country_code":"US","type":"education","lineage":["https://openalex.org/I126547033"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Alain Bertrand Bomgni","raw_affiliation_strings":["Math Science and Technology Oglala Lakota College,Kyle,SD,USA"],"affiliations":[{"raw_affiliation_string":"Math Science and Technology Oglala Lakota College,Kyle,SD,USA","institution_ids":["https://openalex.org/I126547033"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124276500","display_name":"Junior Basile Fofack","orcid":null},"institutions":[{"id":"https://openalex.org/I178331978","display_name":"Universit\u00e9 de Dschang","ror":"https://ror.org/0566t4z20","country_code":"CM","type":"education","lineage":["https://openalex.org/I178331978"]}],"countries":["CM"],"is_corresponding":false,"raw_author_name":"Junior Basile Fofack","raw_affiliation_strings":["University of Dschang,Dept. of Computer Science,Dschang,Cameroon"],"affiliations":[{"raw_affiliation_string":"University of Dschang,Dept. of Computer Science,Dschang,Cameroon","institution_ids":["https://openalex.org/I178331978"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124243243","display_name":"Shiva Aryal","orcid":null},"institutions":[{"id":"https://openalex.org/I189957204","display_name":"University of South Dakota","ror":"https://ror.org/0043h8f16","country_code":"US","type":"education","lineage":["https://openalex.org/I189957204"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shiva Aryal","raw_affiliation_strings":["University of South Dakota,Dept. of Biomedical Engineering,Vermillion,SD,USA"],"affiliations":[{"raw_affiliation_string":"University of South Dakota,Dept. of Biomedical Engineering,Vermillion,SD,USA","institution_ids":["https://openalex.org/I189957204"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124159682","display_name":"Jerry Garvin Lonlac Konlac","orcid":null},"institutions":[{"id":"https://openalex.org/I205703379","display_name":"Institut Mines-T\u00e9l\u00e9com","ror":"https://ror.org/025vp2923","country_code":"FR","type":"facility","lineage":["https://openalex.org/I205703379"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jerry Garvin Lonlac Konlac","raw_affiliation_strings":["IMT Nord Europe Institut Mines-T&#x00E9;l&#x00E9;com, University of Lille, Centre for Digital Systems,Lille,France,F-59000"],"affiliations":[{"raw_affiliation_string":"IMT Nord Europe Institut Mines-T&#x00E9;l&#x00E9;com, University of Lille, Centre for Digital Systems,Lille,France,F-59000","institution_ids":["https://openalex.org/I205703379"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061731299","display_name":"V. Gadhamshetty","orcid":null},"institutions":[{"id":"https://openalex.org/I184647316","display_name":"South Dakota School of Mines and Technology","ror":"https://ror.org/00ch7yk27","country_code":"US","type":"education","lineage":["https://openalex.org/I184647316"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Venkataramana Gadhamshetty","raw_affiliation_strings":["South Dakota School of Mines,Civil and Environmental Engineering Dept.,Rapid City,SD,USA"],"affiliations":[{"raw_affiliation_string":"South Dakota School of Mines,Civil and Environmental Engineering Dept.,Rapid City,SD,USA","institution_ids":["https://openalex.org/I184647316"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124195086","display_name":"Etienne Gnimpieba Z.","orcid":null},"institutions":[{"id":"https://openalex.org/I189957204","display_name":"University of South Dakota","ror":"https://ror.org/0043h8f16","country_code":"US","type":"education","lineage":["https://openalex.org/I189957204"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Etienne Gnimpieba Z.","raw_affiliation_strings":["University of South Dakota,Dept. of Biomedical Engineering,Vermillion,SD,USA"],"affiliations":[{"raw_affiliation_string":"University of South Dakota,Dept. of Biomedical Engineering,Vermillion,SD,USA","institution_ids":["https://openalex.org/I189957204"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5124172818"],"corresponding_institution_ids":["https://openalex.org/I126547033"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.61499622,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"7516","last_page":"7525"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12247","display_name":"Microbial Applications in Construction Materials","score":0.18359999358654022,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12247","display_name":"Microbial Applications in Construction Materials","score":0.18359999358654022,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.1128000020980835,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11923","display_name":"Mine drainage and remediation techniques","score":0.051500000059604645,"subfield":{"id":"https://openalex.org/subfields/2304","display_name":"Environmental Chemistry"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/biomedicine","display_name":"Biomedicine","score":0.7039999961853027},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4952000081539154},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4823000133037567},{"id":"https://openalex.org/keywords/organism","display_name":"Organism","score":0.4462999999523163},{"id":"https://openalex.org/keywords/model-organism","display_name":"Model organism","score":0.4345000088214874},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.4203000068664551},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.38999998569488525},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.36410000920295715},{"id":"https://openalex.org/keywords/in-silico","display_name":"In silico","score":0.361299991607666}],"concepts":[{"id":"https://openalex.org/C66782513","wikidata":"https://www.wikidata.org/wiki/Q864601","display_name":"Biomedicine","level":2,"score":0.7039999961853027},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5460000038146973},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4970000088214874},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4952000081539154},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4823000133037567},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48019999265670776},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46380001306533813},{"id":"https://openalex.org/C137858568","wikidata":"https://www.wikidata.org/wiki/Q7239","display_name":"Organism","level":2,"score":0.4462999999523163},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4449999928474426},{"id":"https://openalex.org/C19843653","wikidata":"https://www.wikidata.org/wiki/Q213907","display_name":"Model organism","level":3,"score":0.4345000088214874},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.4203000068664551},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.38999998569488525},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.36410000920295715},{"id":"https://openalex.org/C2775905019","wikidata":"https://www.wikidata.org/wiki/Q192572","display_name":"In silico","level":3,"score":0.361299991607666},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31839999556541443},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.3158000111579895},{"id":"https://openalex.org/C152662350","wikidata":"https://www.wikidata.org/wiki/Q815297","display_name":"Systems biology","level":2,"score":0.2987000048160553},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.289000004529953},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.2879999876022339},{"id":"https://openalex.org/C194356953","wikidata":"https://www.wikidata.org/wiki/Q648314","display_name":"Sulfate-reducing bacteria","level":3,"score":0.2761000096797943},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.27559998631477356},{"id":"https://openalex.org/C105565629","wikidata":"https://www.wikidata.org/wiki/Q1248292","display_name":"Gene prediction","level":4,"score":0.27459999918937683},{"id":"https://openalex.org/C48702757","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Biological classification","level":2,"score":0.26969999074935913},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.2653999924659729}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm66473.2025.11356101","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm66473.2025.11356101","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1642783708","display_name":null,"funder_award_id":"5P20GM103443-20","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"},{"id":"https://openalex.org/G5950939161","display_name":null,"funder_award_id":"OIA-1849206,OIA-1920954","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1993220166","https://openalex.org/W2025971310","https://openalex.org/W2113140044","https://openalex.org/W2118830783","https://openalex.org/W2128784723","https://openalex.org/W2136632285","https://openalex.org/W2138164217","https://openalex.org/W2146245198","https://openalex.org/W2171464043","https://openalex.org/W2334956771","https://openalex.org/W2341018731","https://openalex.org/W2515139970","https://openalex.org/W2559588208","https://openalex.org/W2599873893","https://openalex.org/W2770062471","https://openalex.org/W2793168264","https://openalex.org/W2904672199","https://openalex.org/W2935703330","https://openalex.org/W2948511028","https://openalex.org/W2973219450","https://openalex.org/W3060299613","https://openalex.org/W3090449731","https://openalex.org/W3111363293","https://openalex.org/W3152564577","https://openalex.org/W3203207117","https://openalex.org/W3216419673","https://openalex.org/W4205097571","https://openalex.org/W4206639076","https://openalex.org/W4313515887","https://openalex.org/W4313527418","https://openalex.org/W4319436492","https://openalex.org/W4365449055","https://openalex.org/W4389306773","https://openalex.org/W4389310586","https://openalex.org/W4390970472","https://openalex.org/W4390971148","https://openalex.org/W4391606045","https://openalex.org/W4395030222","https://openalex.org/W4403561447","https://openalex.org/W4406260077"],"related_works":[],"abstract_inverted_index":{"The":[0,193,234],"identification":[1,17],"of":[2,16,26,31,37,69,122,145,150,160,183,200,203,206,211,244,276,282],"essential":[3,174],"genes":[4],"has":[5,268],"garnered":[6],"considerable":[7],"attention":[8],"from":[9,155],"researchers":[10,289],"in":[11,34,274,295,303],"recent":[12],"years.":[13],"This":[14],"process":[15],"uncovers":[18],"minimal":[19,120,136],"functional":[20],"modules":[21],"that":[22,110,128],"enable":[23],"the":[24,35,67,143,226,242,283,292,296],"survival":[25],"an":[27,198,209],"organism,":[28],"making":[29],"it":[30],"paramount":[32],"importance":[33],"fields":[36],"biomedicine":[38],"and":[39,61,75,101,157,208,254,263],"biotechnology.":[40],"To":[41],"address":[42],"this":[43,83,214,286],"challenging":[44],"issue,":[45],"computational":[46],"methods":[47,273],"have":[48,72,76],"become":[49],"increasingly":[50],"utilized":[51],"to":[52,58,108,164,218,258,290,301],"complement":[53],"experimental":[54,305],"approaches,":[55],"which":[56],"tend":[57],"be":[59,132],"intricate":[60],"costly.":[62],"Various":[63],"classifiers,":[64],"based":[65],"on":[66],"selection":[68],"feature":[70,177],"sets,":[71],"been":[73],"proposed":[74,272],"shown":[77],"promising":[78],"results":[79,235],"thus":[80],"far.":[81],"In":[82],"paper,":[84],"leveraging":[85],"50":[86],"sulfate":[87],"reducing":[88],"bacteria":[89],"(SRB)":[90],"organisms":[91,163,240],"-":[92],"microbes":[93],"frequently":[94],"associated":[95],"with":[96,247,298],"biofilm":[97],"formation,":[98],"biofilm-driven":[99],"corrosion,":[100],"complex":[102],"microbial":[103],"community":[104],"dynamics;":[105],"we":[106,126,187],"aim":[107],"show":[109],"classifiers":[111],"can":[112,131],"achieve":[113],"very":[114],"good":[115],"performance":[116,130],"using":[117,229],"only":[118],"a":[119,166],"set":[121],"relevant":[123,137],"features.":[124,184],"Specifically,":[125],"demonstrate":[127],"classifier":[129],"improved":[133],"by":[134,225],"considering":[135],"features":[138,152],"while":[139],"taking":[140],"into":[141],"account":[142],"taxonomy":[144],"different":[146],"organisms.":[147,233],"A":[148],"total":[149],"37,500":[151],"were":[153],"generated":[154],"nucleotide":[156],"protein":[158],"sequences":[159],"41":[161],"SRB":[162,232],"construct":[165],"machine":[167],"learning":[168],"model":[169],"system":[170,215],"aimed":[171],"at":[172],"predicting":[173],"genes.":[175],"Our":[176,266],"engineering":[178],"module":[179],"identified":[180],"58":[181],"subsets":[182],"Through":[185],"cross-validation,":[186],"achieved":[188],"competitive":[189],"intra-organism":[190],"prediction":[191],"performance.":[192],"best":[194],"models":[195,246],"obtained":[196,236],"had":[197],"AUC":[199,256],"0.99,":[201,204,207,259],"precision":[202],"recall":[205],"F1-score":[210],"0.99.":[212],"Subsequently,":[213],"was":[216],"used":[217],"perform":[219],"extra-organism":[220],"(new":[221],"organism":[222],"not":[223],"seen":[224],"model)":[227],"validation":[228],"nine":[230],"left-out":[231],"for":[237],"these":[238],"test":[239],"demonstrated":[241],"efficacy":[243],"our":[245],"maximum":[248,250,252,255],"precision,":[249],"recall,":[251],"F1-score,":[253],"equal":[257],"<tex":[260],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[261],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$0.99,0.99$</tex>,":[262],"0.97,":[264],"respectively.":[265],"approach":[267,287],"significantly":[269],"outperformed":[270],"previously":[271],"terms":[275],"average":[277],"metrics,":[278],"indicating":[279],"better":[280],"generalization":[281],"models.":[284],"Finally,":[285],"allows":[288],"evaluate":[291],"predicted":[293],"result":[294],"lab":[297],"fewer":[299],"variables":[300],"consider":[302],"their":[304],"design.":[306]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-01-30T00:00:00"}
