{"id":"https://openalex.org/W4224237848","doi":"https://doi.org/10.48550/arxiv.2204.09291","title":"Improving generalization of machine learning-identified biomarkers with causal modeling: an investigation into immune receptor diagnostics","display_name":"Improving generalization of machine learning-identified biomarkers with causal modeling: an investigation into immune receptor diagnostics","publication_year":2022,"publication_date":"2022-04-20","ids":{"openalex":"https://openalex.org/W4224237848","doi":"https://doi.org/10.48550/arxiv.2204.09291"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2204.09291","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.09291","pdf_url":"https://arxiv.org/pdf/2204.09291","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2204.09291","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037853098","display_name":"Milena Pavlovi\u0107","orcid":"https://orcid.org/0000-0002-2484-3868"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Pavlovi\u0107, Milena","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069724737","display_name":"Ghadi S. Al Hajj","orcid":"https://orcid.org/0000-0003-1639-1424"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hajj, Ghadi S. Al","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046161876","display_name":"Johan Pensar","orcid":"https://orcid.org/0000-0002-5158-5761"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kanduri, Chakravarthi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039901579","display_name":"Mollie E. Wood","orcid":"https://orcid.org/0000-0002-9302-2641"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pensar, Johan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081876747","display_name":"Ludvig M. Sollid","orcid":"https://orcid.org/0000-0001-8860-704X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wood, Mollie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089158926","display_name":"Victor Greiff","orcid":"https://orcid.org/0000-0003-2622-5032"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sollid, Ludvig M.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054500587","display_name":"Geir Kjetil Sandve","orcid":"https://orcid.org/0000-0002-4959-1409"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Greiff, Victor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Sandve, Geir Kjetil","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sandve, Geir Kjetil","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5037853098"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9819999933242798,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.9819999933242798,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10621","display_name":"Gene Regulatory Network Analysis","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8095988631248474},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.7230721712112427},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6695519685745239},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.625450849533081},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6014634966850281},{"id":"https://openalex.org/keywords/biomarker","display_name":"Biomarker","score":0.43924179673194885},{"id":"https://openalex.org/keywords/causal-model","display_name":"Causal model","score":0.42241039872169495},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.32038259506225586},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.1653701364994049},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.15116295218467712},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10574454069137573}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8095988631248474},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7230721712112427},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6695519685745239},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.625450849533081},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6014634966850281},{"id":"https://openalex.org/C2781197716","wikidata":"https://www.wikidata.org/wiki/Q864574","display_name":"Biomarker","level":2,"score":0.43924179673194885},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.42241039872169495},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.32038259506225586},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.1653701364994049},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.15116295218467712},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10574454069137573},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C142724271","wikidata":"https://www.wikidata.org/wiki/Q7208","display_name":"Pathology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2204.09291","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.09291","pdf_url":"https://arxiv.org/pdf/2204.09291","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:zenodo.org:7727894","is_oa":true,"landing_page_url":"https://zenodo.org/record/7727894","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/other"},{"id":"doi:10.48550/arxiv.2204.09291","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2204.09291","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2204.09291","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.09291","pdf_url":"https://arxiv.org/pdf/2204.09291","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4399999976158142,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3162204513","https://openalex.org/W2371138613","https://openalex.org/W2048963458","https://openalex.org/W43109613","https://openalex.org/W2359952343","https://openalex.org/W2239445980","https://openalex.org/W2533581028","https://openalex.org/W2080152487","https://openalex.org/W3083152911","https://openalex.org/W3022347918"],"abstract_inverted_index":{"Machine":[0],"learning":[1],"is":[2],"increasingly":[3],"used":[4],"to":[5,21,28,52],"discover":[6],"diagnostic":[7],"and":[8,31,48,55,89,119,127],"prognostic":[9],"biomarkers":[10],"from":[11],"high-dimensional":[12,74],"molecular":[13],"data.":[14],"However,":[15],"a":[16,39,64,70],"variety":[17],"of":[18,45,57,92,124],"factors":[19,91],"related":[20],"experimental":[22,90],"design":[23],"may":[24,96],"affect":[25],"the":[26,43,53,93,98,122,125],"ability":[27],"learn":[29],"generalizable":[30],"clinically":[32],"applicable":[33],"diagnostics.":[34,60],"Here,":[35],"we":[36,67,84,103],"argue":[37,104],"that":[38,105,129],"causal":[40,106],"perspective":[41],"improves":[42,108],"identification":[44],"these":[46],"challenges":[47],"formalizes":[49],"their":[50],"relation":[51],"robustness":[54,112],"generalization":[56],"machine":[58,109],"learning-based":[59,110],"To":[61],"make":[62],"for":[63],"concrete":[65],"discussion,":[66],"focus":[68],"on":[69],"specific,":[71],"recently":[72],"established":[73],"biomarker":[75,111],"-":[76],"adaptive":[77],"immune":[78],"receptor":[79],"repertoires":[80],"(AIRRs).":[81],"Through":[82],"simulations,":[83],"illustrate":[85],"how":[86],"major":[87],"biological":[88],"AIRR":[94],"domain":[95],"influence":[97],"learned":[99],"biomarkers.":[100],"In":[101],"conclusion,":[102],"modeling":[107],"by":[113,120],"identifying":[114],"stable":[115],"relations":[116,126],"between":[117,131],"variables":[118,128],"guiding":[121],"adjustment":[123],"vary":[130],"populations.":[132]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
