{"id":"https://openalex.org/W7143504550","doi":"https://doi.org/10.48550/arxiv.2603.26465","title":"A Boltzmann-machine-enhanced Transformer For DNA Sequence Classification","display_name":"A Boltzmann-machine-enhanced Transformer For DNA Sequence Classification","publication_year":2026,"publication_date":"2026-03-27","ids":{"openalex":"https://openalex.org/W7143504550","doi":"https://doi.org/10.48550/arxiv.2603.26465"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.26465","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26465","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.26465","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130958088","display_name":"Zhixuan Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Zhixuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101111162","display_name":"Yishu Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Yishu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130952866","display_name":"Xuang WU","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"WU, Xuang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.19249999523162842,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.19249999523162842,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.1307000070810318,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12946","display_name":"Fractal and DNA sequence analysis","score":0.11069999635219574,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6140999794006348},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.536300003528595},{"id":"https://openalex.org/keywords/softmax-function","display_name":"Softmax function","score":0.5268999934196472},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4449000060558319},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.4262999892234802},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.42100000381469727},{"id":"https://openalex.org/keywords/latent-variable","display_name":"Latent variable","score":0.3970000147819519},{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.383899986743927},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.36419999599456787}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6140999794006348},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.536300003528595},{"id":"https://openalex.org/C188441871","wikidata":"https://www.wikidata.org/wiki/Q7554146","display_name":"Softmax function","level":3,"score":0.5268999934196472},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.47600001096725464},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4740999937057495},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45249998569488525},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4449000060558319},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.4262999892234802},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.42100000381469727},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.3970000147819519},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.383899986743927},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.36419999599456787},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.35830000042915344},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.35269999504089355},{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.3490000069141388},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34439998865127563},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.3294000029563904},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.32739999890327454},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31520000100135803},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3095000088214874},{"id":"https://openalex.org/C14961307","wikidata":"https://www.wikidata.org/wiki/Q5377176","display_name":"Energy minimization","level":2,"score":0.29789999127388},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.29660001397132874},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.29330000281333923},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.28619998693466187},{"id":"https://openalex.org/C33553690","wikidata":"https://www.wikidata.org/wiki/Q17014702","display_name":"Free energy principle","level":2,"score":0.27480000257492065},{"id":"https://openalex.org/C57830394","wikidata":"https://www.wikidata.org/wiki/Q278079","display_name":"Posterior probability","level":3,"score":0.2741999924182892},{"id":"https://openalex.org/C190502265","wikidata":"https://www.wikidata.org/wiki/Q17069496","display_name":"MNIST database","level":3,"score":0.2694000005722046},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C192328126","wikidata":"https://www.wikidata.org/wiki/Q4514647","display_name":"Schematic","level":2,"score":0.26489999890327454},{"id":"https://openalex.org/C65965080","wikidata":"https://www.wikidata.org/wiki/Q1806885","display_name":"Latent variable model","level":3,"score":0.2603999972343445},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.25360000133514404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.26465","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26465","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.26465","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26465","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8253955245018005,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"DNA":[0,62],"sequence":[1,63],"classification":[2,154],"requires":[3],"not":[4],"only":[5],"high":[6],"predictive":[7],"accuracy":[8],"but":[9],"also":[10],"the":[11,25,69,159,175,178,186,193],"ability":[12],"to":[13,76,127,137,161,185],"uncover":[14],"latent":[15,78,105],"site":[16],"interactions,":[17],"combinatorial":[18,110],"regulation,":[19],"and":[20,39,81,100,104,132,155,169,181,192,211],"epistasis-like":[21],"higher-order":[22,109],"dependencies.":[23,111],"Although":[24],"standard":[26],"Transformer":[27,60],"provides":[28,200],"strong":[29],"global":[30],"modeling":[31],"capacity,":[32],"its":[33],"softmax":[34],"attention":[35],"is":[36,120],"continuous,":[37],"dense,":[38],"weakly":[40],"constrained,":[41],"making":[42],"it":[43,134],"better":[44],"suited":[45],"for":[46,61,213],"information":[47],"routing":[48],"than":[49],"explicit":[50],"structure":[51],"discovery.":[52],"In":[53],"this":[54],"paper,":[55],"we":[56,122,151],"propose":[57],"a":[58,85,201],"Boltzmann-machine-enhanced":[59],"classification.":[64],"Built":[65],"on":[66,216],"multi-head":[67],"attention,":[68],"model":[70,108,160],"introduces":[71],"structured":[72,214],"binary":[73],"gating":[74,118],"variables":[75],"represent":[77],"query-key":[79],"connections":[80],"constrains":[82],"them":[83],"with":[84,135],"Boltzmann-style":[86],"energy":[87,156,179,184],"function.":[88],"Query-key":[89],"similarity":[90],"defines":[91],"local":[92],"bias":[93],"terms,":[94],"learnable":[95],"pairwise":[96],"interactions":[97],"capture":[98],"synergy":[99],"competition":[101],"between":[102],"edges,":[103],"hidden":[106],"units":[107],"Since":[112],"exact":[113],"posterior":[114],"inference":[115,126],"over":[116],"discrete":[117,209],"graphs":[119],"intractable,":[121],"use":[123],"mean-field":[124,187],"variational":[125,182],"estimate":[128],"edge":[129],"activation":[130],"probabilities":[131,141],"combine":[133],"Gumbel-Softmax":[136,190],"progressively":[138],"compress":[139],"continuous":[140],"into":[142],"near-discrete":[143],"gates":[144],"while":[145,165],"preserving":[146],"end-to-end":[147],"differentiability.":[148],"During":[149],"training,":[150],"jointly":[152],"optimize":[153],"losses,":[157],"encouraging":[158],"achieve":[162],"accurate":[163],"prediction":[164],"favoring":[166],"low-energy,":[167],"stable,":[168],"interpretable":[170],"structures.":[171],"We":[172],"further":[173],"derive":[174],"framework":[176,199],"from":[177],"function":[180],"free":[183],"fixed-point":[188],"equations,":[189],"relaxation,":[191],"final":[194],"joint":[195],"objective.":[196],"The":[197],"proposed":[198],"unified":[202],"view":[203],"of":[204],"integrating":[205],"Boltzmann":[206],"machines,":[207],"differentiable":[208],"optimization,":[210],"Transformers":[212],"learning":[215],"biological":[217],"sequences.":[218]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-31T00:00:00"}
