{"id":"https://openalex.org/W4417250791","doi":"https://doi.org/10.1109/bibe66822.2025.00114","title":"Blood-Based Minimal Gene Panel for Granulocytic Phenotyping in Copd Using Contrastive Graph Learning and Gradient Boosted Classification","display_name":"Blood-Based Minimal Gene Panel for Granulocytic Phenotyping in Copd Using Contrastive Graph Learning and Gradient Boosted Classification","publication_year":2025,"publication_date":"2025-11-06","ids":{"openalex":"https://openalex.org/W4417250791","doi":"https://doi.org/10.1109/bibe66822.2025.00114"},"language":null,"primary_location":{"id":"doi:10.1109/bibe66822.2025.00114","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibe66822.2025.00114","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 25th International Conference on Bioinformatics and Bioengineering (BIBE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Aadit Shrivastava","orcid":null},"institutions":[{"id":"https://openalex.org/I4210162751","display_name":"Newark Academy","ror":"https://ror.org/05d3xvm78","country_code":"US","type":"education","lineage":["https://openalex.org/I4210162751"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Aadit Shrivastava","raw_affiliation_strings":["Biology Dept. of Science, Newark Academy,Livingston,United States"],"affiliations":[{"raw_affiliation_string":"Biology Dept. of Science, Newark Academy,Livingston,United States","institution_ids":["https://openalex.org/I4210162751"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210162751"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.34354385,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"658","last_page":"663"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.11029999703168869,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.11029999703168869,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.07739999890327454,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11642","display_name":"Genomics and Rare Diseases","score":0.07150000333786011,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5370000004768372},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.5108000040054321},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.478300005197525},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.4383000135421753},{"id":"https://openalex.org/keywords/copd","display_name":"COPD","score":0.4287000000476837},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4050000011920929},{"id":"https://openalex.org/keywords/pulmonary-disease","display_name":"Pulmonary disease","score":0.4016000032424927},{"id":"https://openalex.org/keywords/gradient-boosting","display_name":"Gradient boosting","score":0.3944000005722046}],"concepts":[{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5370000004768372},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5224999785423279},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.5108000040054321},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.478300005197525},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.4383000135421753},{"id":"https://openalex.org/C2776780178","wikidata":"https://www.wikidata.org/wiki/Q199804","display_name":"COPD","level":2,"score":0.4287000000476837},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4050000011920929},{"id":"https://openalex.org/C2992779976","wikidata":"https://www.wikidata.org/wiki/Q3286546","display_name":"Pulmonary disease","level":2,"score":0.4016000032424927},{"id":"https://openalex.org/C70153297","wikidata":"https://www.wikidata.org/wiki/Q5591907","display_name":"Gradient boosting","level":3,"score":0.3944000005722046},{"id":"https://openalex.org/C188441871","wikidata":"https://www.wikidata.org/wiki/Q7554146","display_name":"Softmax function","level":3,"score":0.39320001006126404},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.37459999322891235},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.3675000071525574},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3594000041484833},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.3562999963760376},{"id":"https://openalex.org/C2776879701","wikidata":"https://www.wikidata.org/wiki/Q25048660","display_name":"Multiple kernel learning","level":4,"score":0.3409000039100647},{"id":"https://openalex.org/C127716648","wikidata":"https://www.wikidata.org/wiki/Q104053","display_name":"Phenotype","level":3,"score":0.34040001034736633},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.33489999175071716},{"id":"https://openalex.org/C2984324147","wikidata":"https://www.wikidata.org/wiki/Q3080021","display_name":"Gene selection","level":5,"score":0.32989999651908875},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3091999888420105},{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.30720001459121704},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.2919999957084656},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.28450000286102295},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2802000045776367},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibe66822.2025.00114","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibe66822.2025.00114","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 25th International Conference on Bioinformatics and Bioengineering (BIBE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W1981947694","https://openalex.org/W2889531427","https://openalex.org/W4389187939","https://openalex.org/W4399387247"],"related_works":[],"abstract_inverted_index":{"Chronic":[0],"obstructive":[1],"pulmonary":[2],"disease":[3],"(COPD)":[4],"affects":[5],"over":[6],"480":[7],"million":[8],"people":[9],"worldwide,":[10],"underscoring":[11],"the":[12,49,132,152],"need":[13],"for":[14,169],"clinically":[15,161],"scalable,":[16],"non-invasive":[17],"inflammatory":[18],"subtyping.":[19],"This":[20],"study":[21],"presents":[22],"a":[23,35,41,69,104,160],"pipeline":[24],"that":[25],"uses":[26],"contrastive":[27,56],"graph":[28],"learning":[29],"on":[30,103],"peripheral-blood":[31],"RNA-sequencing":[32],"to":[33],"curate":[34],"compact":[36],"gene":[37,167],"panel":[38,71,94,154,168],"and":[39,64,100,117,127,137,163],"power":[40],"gradient":[42],"boosted":[43],"classifier":[44],"of":[45,62,68],"granulocytic":[46,171],"phenotypes.":[47],"Using":[48],"GSE240656":[50],"multi-cohort":[51],"dataset":[52],"(<tex":[53],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[54,109],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{n}=294$</tex>),":[55],"embeddings":[57],"aligned":[58],"with":[59,131,140],"clinical":[60,133],"labeling":[61],"phenotypes":[63],"guided":[65],"algorithmic":[66],"selection":[67],"16-gene":[70],"(S100A8,":[72],"S100A9,":[73],"MPO,":[74],"ELANE,":[75],"CXCL8,":[76],"MMP9,":[77],"S100A12,":[78],"CLC,":[79],"PRG2,":[80],"RNASE2,":[81],"IL5RA,":[82],"SIGLEC8,":[83],"CCR3,":[84],"PTGDR2,":[85],"LTF,":[86],"IFIT3).":[87],"A":[88],"LightGBM":[89],"model":[90],"trained":[91],"using":[92],"this":[93],"achieved":[95],"0.915":[96],"accuracy,":[97],"0.928":[98],"macro-F1,":[99],"0.967":[101],"macro-AUROC":[102],"sealed":[105],"test":[106],"set":[107],"<tex":[108],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$(\\mathbf{n}=59)$</tex>,":[110],"outperforming":[111],"feedforward":[112],"neural":[113],"network,":[114],"random":[115],"forest,":[116],"logistic":[118],"regression":[119],"classifiers.":[120],"The":[121],"calibrated":[122],"probability":[123],"difference":[124],"between":[125,135],"eosinophilic":[126],"neutrophilic":[128],"classes":[129],"correlated":[130],"log-ratio":[134],"eosinophil":[136],"neutrophil":[138],"counts,":[139],"Spearman's":[141],"coefficient":[142],"equaling":[143],"0.80.":[144],"Global":[145],"SHAP":[146],"exhibited":[147],"distributed,":[148],"mechanism-consistent":[149],"attributions,":[150],"supporting":[151],"deliberate":[153],"curation":[155],"method.":[156],"These":[157],"results":[158],"support":[159],"feasible":[162],"explainable":[164],"blood-based":[165],"minimal":[166],"predictive":[170],"phenotyping":[172],"in":[173],"COPD.":[174]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-12-11T00:00:00"}
