{"id":"https://openalex.org/W7131871035","doi":"https://doi.org/10.48550/arxiv.2602.22387","title":"Disentangling Shared and Target-Enriched Topics via Background-Contrastive Non-negative Matrix Factorization","display_name":"Disentangling Shared and Target-Enriched Topics via Background-Contrastive Non-negative Matrix Factorization","publication_year":2026,"publication_date":"2026-02-25","ids":{"openalex":"https://openalex.org/W7131871035","doi":"https://doi.org/10.48550/arxiv.2602.22387"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.22387","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127161335","display_name":"Yixuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Yixuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012091034","display_name":"Archer Y. Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Archer Y.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127215952","display_name":"Yue Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yue","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5127161335"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.39649999141693115,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.39649999141693115,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.28870001435279846,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.05040000006556511,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.6366999745368958},{"id":"https://openalex.org/keywords/multiplicative-function","display_name":"Multiplicative function","score":0.6202999949455261},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5105999708175659},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.4903999865055084},{"id":"https://openalex.org/keywords/factorization","display_name":"Factorization","score":0.4560000002384186},{"id":"https://openalex.org/keywords/biological-data","display_name":"Biological data","score":0.44999998807907104},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4471000134944916},{"id":"https://openalex.org/keywords/multiplication","display_name":"Multiplication (music)","score":0.4221999943256378},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.3880000114440918}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7096999883651733},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.6366999745368958},{"id":"https://openalex.org/C42747912","wikidata":"https://www.wikidata.org/wiki/Q1048447","display_name":"Multiplicative function","level":2,"score":0.6202999949455261},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5105999708175659},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.4903999865055084},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48820000886917114},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4650000035762787},{"id":"https://openalex.org/C187834632","wikidata":"https://www.wikidata.org/wiki/Q188804","display_name":"Factorization","level":2,"score":0.4560000002384186},{"id":"https://openalex.org/C201797286","wikidata":"https://www.wikidata.org/wiki/Q4914986","display_name":"Biological data","level":2,"score":0.44999998807907104},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4471000134944916},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.4221999943256378},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.3880000114440918},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.38749998807907104},{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.3853999972343445},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.3732999861240387},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3693000078201294},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.34220001101493835},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.33550000190734863},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.3215000033378601},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.321399986743927},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.2994000017642975},{"id":"https://openalex.org/C2780985081","wikidata":"https://www.wikidata.org/wiki/Q676502","display_name":"Data Matrix","level":5,"score":0.29120001196861267},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2892000079154968},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28519999980926514},{"id":"https://openalex.org/C2776545253","wikidata":"https://www.wikidata.org/wiki/Q5464292","display_name":"Folding (DSP implementation)","level":2,"score":0.27070000767707825},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.25929999351501465}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.22387","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.22387","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22387","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.22387","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Biological":[0],"signals":[1,159],"of":[2],"interest":[3],"in":[4,167,177,182,188],"high-dimensional":[5],"data":[6,142],"are":[7,43,55,105],"often":[8,44],"masked":[9],"by":[10,77,120,161],"dominant":[11],"variation":[12],"shared":[13,88],"across":[14],"conditions.":[15],"This":[16,99],"variation,":[17],"arising":[18],"from":[19,32],"baseline":[20],"biological":[21,49,155],"structure":[22],"or":[23,61],"technical":[24],"effects,":[25],"can":[26],"prevent":[27],"standard":[28],"dimensionality":[29],"reduction":[30],"methods":[31,54],"resolving":[33],"condition-specific":[34],"structure.":[35,98],"The":[36],"challenge":[37],"is":[38,118,132],"that":[39,95,104,130],"these":[40],"confounding":[41],"topics":[42,76],"unknown":[45],"and":[46,83,112,138,153,184],"mixed":[47],"with":[48],"signals.":[50],"Existing":[51],"background":[52,66,86],"correction":[53],"either":[56],"unscalable":[57],"to":[58,140,147],"high":[59],"dimensions":[60],"not":[62],"interpretable.":[63],"We":[64],"introduce":[65],"contrastive":[67,93],"Non-negative":[68],"Matrix":[69],"Factorization":[70],"(\\model),":[71],"which":[72],"extracts":[73],"target-enriched":[74],"latent":[75],"jointly":[78],"factorizing":[79],"a":[80,84,92],"target":[81],"dataset":[82],"matched":[85],"using":[87],"non-negative":[89,102],"bases":[90],"under":[91],"objective":[94],"suppresses":[96],"background-expressed":[97],"approach":[100],"yields":[101],"components":[103],"directly":[106],"interpretable":[107],"at":[108],"the":[109],"feature":[110],"level,":[111],"explicitly":[113],"isolates":[114],"target-specific":[115],"variation.":[116],"\\model":[117,157],"learned":[119],"an":[121],"efficient":[122,134],"multiplicative":[123],"update":[124],"algorithm":[125],"via":[126,143],"matrix":[127],"multiplication":[128],"such":[129],"it":[131],"highly":[133],"on":[135],"GPU":[136],"hardware":[137],"scalable":[139],"big":[141],"minibatch":[144],"training":[145],"akin":[146],"deep":[148],"learning":[149],"approach.":[150],"Across":[151],"simulations":[152],"diverse":[154],"datasets,":[156],"reveals":[158],"obscured":[160],"conventional":[162],"methods,":[163],"including":[164],"disease-associated":[165],"programs":[166],"postmortem":[168],"depressive":[169],"brain":[170],"single-cell":[171],"RNA-seq,":[172],"genotype-linked":[173],"protein":[174],"expression":[175],"patterns":[176],"mice,":[178],"treatment-specific":[179],"transcriptional":[180],"changes":[181],"leukemia,":[183],"TP53-dependent":[185],"drug":[186],"responses":[187],"cancer":[189],"cell":[190],"lines.":[191]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-28T00:00:00"}
