{"id":"https://openalex.org/W7116058981","doi":"https://doi.org/10.48550/arxiv.2512.14726","title":"Quantum Decision Transformers (QDT): Synergistic Entanglement and Interference for Offline Reinforcement Learning","display_name":"Quantum Decision Transformers (QDT): Synergistic Entanglement and Interference for Offline Reinforcement Learning","publication_year":2025,"publication_date":"2025-12-09","ids":{"openalex":"https://openalex.org/W7116058981","doi":"https://doi.org/10.48550/arxiv.2512.14726"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.14726","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.14726","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.14726","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Weinberg, Abraham Itzhak","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Weinberg, Abraham Itzhak","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.48669999837875366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.48669999837875366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.09000000357627869,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.04859999939799309,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7789000272750854},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5555999875068665},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.5002999901771545},{"id":"https://openalex.org/keywords/feed-forward","display_name":"Feed forward","score":0.44940000772476196},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.439300000667572},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.38449999690055847},{"id":"https://openalex.org/keywords/interdependence","display_name":"Interdependence","score":0.35019999742507935}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7789000272750854},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6956999897956848},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5555999875068665},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.5002999901771545},{"id":"https://openalex.org/C38858127","wikidata":"https://www.wikidata.org/wiki/Q5441228","display_name":"Feed forward","level":2,"score":0.44940000772476196},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.439300000667572},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42570000886917114},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.38449999690055847},{"id":"https://openalex.org/C185874996","wikidata":"https://www.wikidata.org/wiki/Q269699","display_name":"Interdependence","level":2,"score":0.35019999742507935},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33239999413490295},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3027999997138977},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.3027999997138977},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.28949999809265137},{"id":"https://openalex.org/C58053490","wikidata":"https://www.wikidata.org/wiki/Q176555","display_name":"Quantum computer","level":3,"score":0.28049999475479126},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C121040770","wikidata":"https://www.wikidata.org/wiki/Q215675","display_name":"Quantum entanglement","level":3,"score":0.2615000009536743}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.14726","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.14726","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.14726","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.14726","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Offline":[0],"reinforcement":[1,190],"learning":[2,5,191],"enables":[3],"policy":[4],"from":[6],"pre-collected":[7],"datasets":[8],"without":[9],"environment":[10],"interaction,":[11],"but":[12],"existing":[13],"Decision":[14,31],"Transformer":[15,32],"(DT)":[16],"architectures":[17,182],"struggle":[18],"with":[19,53,65,91,186],"long-horizon":[20],"credit":[21,151],"assignment":[22,152],"and":[23,61,68,162],"complex":[24],"state-action":[25],"dependencies.":[26],"We":[27],"introduce":[28],"the":[29],"Quantum":[30,62],"(QDT),":[33],"a":[34,176],"novel":[35],"architecture":[36,130,194],"incorporating":[37],"quantum-inspired":[38,107,129,172],"computational":[39,148],"mechanisms":[40,137],"to":[41,88,192],"address":[42],"these":[43],"challenges.":[44],"Our":[45,143],"approach":[46],"integrates":[47],"two":[48],"core":[49],"components:":[50,108],"Quantum-Inspired":[51],"Attention":[52],"entanglement":[54],"operations":[55],"that":[56,127],"capture":[57],"non-local":[58,154],"feature":[59],"correlations,":[60,155],"Feedforward":[63],"Networks":[64],"multi-path":[66],"processing":[67],"learnable":[69,167],"interference":[70],"for":[71,179],"adaptive":[72,163],"computation.":[73],"Through":[74],"comprehensive":[75],"experiments":[76],"on":[77],"continuous":[78],"control":[79],"tasks,":[80],"we":[81],"demonstrate":[82],"over":[83],"2,000\\%":[84],"performance":[85],"improvement":[86],"compared":[87],"standard":[89],"DTs,":[90],"superior":[92],"generalization":[93],"across":[94],"varying":[95],"data":[96],"qualities.":[97],"Critically,":[98],"our":[99],"ablation":[100],"studies":[101],"reveal":[102],"strong":[103],"synergistic":[104],"effects":[105],"between":[106],"neither":[109],"alone":[110],"achieves":[111],"competitive":[112],"performance,":[113],"yet":[114],"their":[115],"combination":[116],"produces":[117],"dramatic":[118],"improvements":[119],"far":[120],"exceeding":[121],"individual":[122],"contributions.":[123],"This":[124],"synergy":[125],"demonstrates":[126],"effective":[128],"design":[131,173,195],"requires":[132],"holistic":[133],"co-design":[134],"of":[135],"interdependent":[136],"rather":[138],"than":[139],"modular":[140],"component":[141],"adoption.":[142],"analysis":[144],"identifies":[145],"three":[146],"key":[147],"advantages:":[149],"enhanced":[150],"through":[153,166],"implicit":[156],"ensemble":[157],"behavior":[158],"via":[159],"parallel":[160],"processing,":[161],"resource":[164],"allocation":[165],"interference.":[168],"These":[169],"findings":[170],"establish":[171],"principles":[174],"as":[175],"promising":[177],"direction":[178],"advancing":[180],"transformer":[181],"in":[183],"sequential":[184],"decision-making,":[185],"implications":[187],"extending":[188],"beyond":[189],"neural":[193],"more":[196],"broadly.":[197]},"counts_by_year":[],"updated_date":"2025-12-19T19:45:34.690201","created_date":"2025-12-19T00:00:00"}
