{"id":"https://openalex.org/W7138089501","doi":"https://doi.org/10.1609/aaai.v40i1.37046","title":"CLM-Access: A Specialized Foundation Model for High-Dimensional Single-Cell ATAC-Seq Analysis","display_name":"CLM-Access: A Specialized Foundation Model for High-Dimensional Single-Cell ATAC-Seq Analysis","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138089501","doi":"https://doi.org/10.1609/aaai.v40i1.37046"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i1.37046","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i1.37046","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37046/41008","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37046/41008","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129653718","display_name":"Ziqiang Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziqiang Liu","raw_affiliation_strings":["Hangzhou Institute of Medicine, Chinese Academy of Sciences"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hangzhou Institute of Medicine, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129677013","display_name":"Bowen Li","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bowen Li","raw_affiliation_strings":["Hangzhou Institute of Medicine, Chinese Academy of Sciences"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hangzhou Institute of Medicine, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129711568","display_name":"Zhenyu Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I204512498","display_name":"University of Macau","ror":"https://ror.org/01r4q9n85","country_code":"MO","type":"education","lineage":["https://openalex.org/I204512498"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Zhenyu Xu","raw_affiliation_strings":["Hangzhou Institute of Medicine, Chinese Academy of Sciences\nFaculty of Health Science, University of Macau"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hangzhou Institute of Medicine, Chinese Academy of Sciences\nFaculty of Health Science, University of Macau","institution_ids":["https://openalex.org/I204512498"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126439126","display_name":"Yantao Li","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yantao Li","raw_affiliation_strings":["Hangzhou Institute of Medicine, Chinese Academy of Sciences"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hangzhou Institute of Medicine, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067464588","display_name":"Junwei Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junwei Zhang","raw_affiliation_strings":["Hangzhou Institute of Medicine, Chinese Academy of Sciences"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hangzhou Institute of Medicine, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063787927","display_name":"Chulin Sha","orcid":"https://orcid.org/0000-0001-8725-8642"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chulin Sha","raw_affiliation_strings":["Hangzhou Institute of Medicine, Chinese Academy of Sciences"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hangzhou Institute of Medicine, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129681367","display_name":"Xiaolin Li","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolin Li","raw_affiliation_strings":["Hangzhou Institute of Medicine, Chinese Academy of Sciences"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hangzhou Institute of Medicine, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":8.9091,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.96907216,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"40","issue":"1","first_page":"791","last_page":"799"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11289","display_name":"Single-cell and spatial transcriptomics","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.001500000013038516,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.00139999995008111,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5073999762535095},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.45559999346733093},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4375},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.42800000309944153},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.42570000886917114},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.41589999198913574},{"id":"https://openalex.org/keywords/epigenomics","display_name":"Epigenomics","score":0.39320001006126404},{"id":"https://openalex.org/keywords/chromatin","display_name":"Chromatin","score":0.37619999051094055},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.36730000376701355}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6541000008583069},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5073999762535095},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.45559999346733093},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4375},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.42800000309944153},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.42570000886917114},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.41589999198913574},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.39959999918937683},{"id":"https://openalex.org/C121912465","wikidata":"https://www.wikidata.org/wiki/Q3589153","display_name":"Epigenomics","level":5,"score":0.39320001006126404},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3880000114440918},{"id":"https://openalex.org/C83640560","wikidata":"https://www.wikidata.org/wiki/Q180951","display_name":"Chromatin","level":3,"score":0.37619999051094055},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.36730000376701355},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.3637000024318695},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.34779998660087585},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.3100000023841858},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.30970001220703125},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3000999987125397},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2946999967098236},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2865000069141388},{"id":"https://openalex.org/C2777611551","wikidata":"https://www.wikidata.org/wiki/Q17951","display_name":"Jargon","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2766000032424927},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C90734943","wikidata":"https://www.wikidata.org/wiki/Q17008777","display_name":"Conceptualization","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.25870001316070557}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i1.37046","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i1.37046","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37046/41008","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i1.37046","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i1.37046","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/37046/41008","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7566288113594055,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138089501.pdf","grobid_xml":"https://content.openalex.org/works/W7138089501.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Inspired":[0],"by":[1],"the":[2,82,89,225],"success":[3],"of":[4,45,53,85,92,96,143,227],"large":[5],"language":[6,11,14],"models":[7,15,37,55],"(LLMs)":[8],"in":[9,193,229],"natural":[10],"processing,":[12],"cell":[13,25,201],"(CLMs)":[16],"have":[17,38],"emerged":[18],"as":[19],"a":[20,43,51,116,150,163,213],"promising":[21],"paradigm":[22],"to":[23,81,156],"learn":[24],"representations":[26],"from":[27,33],"high-dimensional":[28,159],"single-cell":[29,64,220,230],"data\u2014particularly":[30],"transcriptomic":[31],"profiles":[32],"scRNA-seq.":[34],"These":[35],"foundation":[36,54,118,217],"shown":[39],"remarkable":[40],"potential":[41],"across":[42],"variety":[44],"downstream":[46,195],"applications.":[47],"However,":[48],"there":[49],"remains":[50],"lack":[52,95],"for":[56,69,120,219],"scATAC-seq":[57,86,121],"data,":[58,87],"which":[59],"measures":[60],"chromatin":[61,93,147],"accessibility":[62],"at":[63],"level":[65],"and":[66,101,113,153,161,166,179,207,215,223],"is":[67,76],"critical":[68],"decoding":[70],"epigenetic":[71],"regulation.":[72],"Developing":[73],"such":[74],"model":[75,119,218],"considerably":[77],"more":[78],"challenging":[79],"due":[80],"unique":[83],"characteristics":[84],"including":[88,197],"vast":[90],"number":[91],"regions,":[94],"standardized":[97],"annotations,":[98],"extreme":[99],"sparsity,":[100],"near-binary":[102],"distributions.":[103],"To":[104],"address":[105],"these":[106],"challenges,":[107],"we":[108,185],"systematically":[109],"explore":[110],"various":[111],"strategies":[112],"propose":[114],"CLM-Access,":[115],"specialized":[117,151],"data.":[122],"CLM-Access":[123,188],"incorporates":[124],"three":[125],"main":[126],"innovations:":[127],"(1)":[128],"an":[129,140],"unified":[130,141],"data":[131],"processing":[132],"pipeline":[133],"that":[134,170,187],"maps":[135],"2.8":[136],"million":[137,146],"cells":[138],"onto":[139],"reference":[142],"over":[144],"1":[145],"regions;":[148],"(2)":[149],"patching":[152],"embedding":[154],"strategy":[155],"effectively":[157],"manage":[158],"inputs;":[160],"(3)":[162],"tailored":[164],"masking":[165],"loss":[167],"function":[168],"design":[169],"preserves":[171],"fine-grained":[172],"regional":[173],"information":[174],"while":[175],"enhancing":[176],"training":[177],"efficiency":[178],"representation":[180],"quality.":[181],"With":[182],"comprehensive":[183],"benchmarks,":[184],"show":[186],"significantly":[189],"outperforms":[190],"existing":[191],"methods":[192],"key":[194],"tasks,":[196],"batch":[198],"effect":[199],"correction,":[200],"type":[202],"annotation,":[203],"RNA":[204],"expression":[205],"prediction,":[206],"multi-modal":[208],"integration.":[209],"This":[210],"work":[211],"establishes":[212],"scalable":[214],"interpretable":[216],"epigenomic":[221],"analysis":[222],"expands":[224],"application":[226],"CLMs":[228],"research.":[231]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-18T00:00:00"}
