{"id":"https://openalex.org/W2981943555","doi":"https://doi.org/10.1109/tnnls.2019.2942951","title":"AlphaSeq: Sequence Discovery With Deep Reinforcement Learning","display_name":"AlphaSeq: Sequence Discovery With Deep Reinforcement Learning","publication_year":2019,"publication_date":"2019-10-21","ids":{"openalex":"https://openalex.org/W2981943555","doi":"https://doi.org/10.1109/tnnls.2019.2942951","mag":"2981943555","pmid":"https://pubmed.ncbi.nlm.nih.gov/31634848"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2019.2942951","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2019.2942951","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037069274","display_name":"Yulin Shao","orcid":"https://orcid.org/0000-0002-6300-3175"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Yulin Shao","raw_affiliation_strings":["Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019164720","display_name":"Soung Chang Liew","orcid":"https://orcid.org/0000-0001-7055-6483"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Soung Chang Liew","raw_affiliation_strings":["Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066110295","display_name":"Taotao Wang","orcid":"https://orcid.org/0000-0001-9454-4997"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]},{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN","HK"],"is_corresponding":false,"raw_author_name":"Taotao Wang","raw_affiliation_strings":["College of Information Engineering, Shenzhen University, Shenzhen, China","Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong"],"affiliations":[{"raw_affiliation_string":"College of Information Engineering, Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]},{"raw_affiliation_string":"Department of Information Engineering, The Chinese University of Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5037069274"],"corresponding_institution_ids":["https://openalex.org/I177725633"],"apc_list":null,"apc_paid":null,"fwci":1.8927,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.89671077,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"31","issue":"9","first_page":"3319","last_page":"3333"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.974399983882904,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.7409884333610535},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7175838947296143},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6907265782356262},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6013249158859253},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.513782799243927},{"id":"https://openalex.org/keywords/symbol","display_name":"Symbol (formal)","score":0.4792749583721161},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.452359676361084},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4441075026988983},{"id":"https://openalex.org/keywords/sequence-learning","display_name":"Sequence learning","score":0.4278075397014618},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.41548168659210205},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3545496165752411},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.2022354006767273},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14894363284111023},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.12055635452270508}],"concepts":[{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.7409884333610535},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7175838947296143},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6907265782356262},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6013249158859253},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.513782799243927},{"id":"https://openalex.org/C134400042","wikidata":"https://www.wikidata.org/wiki/Q2372244","display_name":"Symbol (formal)","level":2,"score":0.4792749583721161},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.452359676361084},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4441075026988983},{"id":"https://openalex.org/C40506919","wikidata":"https://www.wikidata.org/wiki/Q7452469","display_name":"Sequence learning","level":2,"score":0.4278075397014618},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.41548168659210205},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3545496165752411},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.2022354006767273},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14894363284111023},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.12055635452270508},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2019.2942951","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2019.2942951","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:31634848","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/31634848","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7599999904632568,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G7725960137","display_name":null,"funder_award_id":"14200417","funder_id":"https://openalex.org/F4320334890","funder_display_name":"University Research Committee, University of Hong Kong"}],"funders":[{"id":"https://openalex.org/F4320334890","display_name":"University Research Committee, University of Hong Kong","ror":"https://ror.org/02zhqgq86"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W1525552993","https://openalex.org/W1548023092","https://openalex.org/W1625390266","https://openalex.org/W1974592178","https://openalex.org/W1981837599","https://openalex.org/W2002273713","https://openalex.org/W2038833866","https://openalex.org/W2046476204","https://openalex.org/W2115229528","https://openalex.org/W2119567691","https://openalex.org/W2121863487","https://openalex.org/W2125193578","https://openalex.org/W2126316555","https://openalex.org/W2138548210","https://openalex.org/W2145339207","https://openalex.org/W2158124810","https://openalex.org/W2176699305","https://openalex.org/W2257979135","https://openalex.org/W2504855616","https://openalex.org/W2564803820","https://openalex.org/W2580175322","https://openalex.org/W2766447205","https://openalex.org/W2772709170","https://openalex.org/W2793057111","https://openalex.org/W2919115771","https://openalex.org/W2981943555","https://openalex.org/W3103559770","https://openalex.org/W4230591943","https://openalex.org/W4242085752","https://openalex.org/W6732665253","https://openalex.org/W6746177919"],"related_works":["https://openalex.org/W4400868993","https://openalex.org/W3096874164","https://openalex.org/W1985560493","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W3168977894"],"abstract_inverted_index":{"Sequences":[0,117],"play":[1],"an":[2,18,48,68,131],"important":[3],"role":[4],"in":[5,52,58,169,188,216],"many":[6,136],"applications":[7],"and":[8,106,127,195],"systems.":[9,220],"Discovering":[10],"sequences":[11,33,200],"with":[12,76,142,155],"desired":[13,32],"properties":[14],"has":[15],"long":[16],"been":[17],"interesting":[19],"intellectual":[20],"pursuit.":[21],"This":[22],"article":[23],"puts":[24],"forth":[25],"a":[26,54,63,77,84,101,125,176,211],"new":[27,199],"paradigm,":[28],"AlphaSeq,":[29,122],"to":[30,113,129,159],"discover":[31],"algorithmically":[34],"using":[35],"deep":[36],"reinforcement":[37],"learning":[38],"(DRL)":[39],"techniques.":[40],"AlphaSeq":[41,96,149,168,173,197],"treats":[42],"the":[43,59,71,90,93,98,108,115,164,203,207],"sequence":[44,64,80,94,144],"discovery":[45],"problem":[46],"as":[47,100,121,124],"episodic":[49],"symbol-filling":[50],"game,":[51],"which":[53,83],"player":[55,134],"fills":[56],"symbols":[57],"vacant":[60],"positions":[61],"of":[62,70,92,111,138,167,178],"set":[65,177],"sequentially":[66],"during":[67],"episode":[69,74],"game.":[72],"Each":[73],"ends":[75],"completely":[78],"filled":[79],"set,":[81],"upon":[82],"reward":[85],"is":[86,150],"given":[87],"based":[88],"on":[89],"desirability":[91],"set.":[95],"models":[97],"game":[99,133,139],"Markov":[102],"decision":[103],"process":[104],"(MDP)":[105],"adapts":[107],"DRL":[109],"framework":[110],"AlphaGo":[112],"solve":[114],"MDP.":[116],"discovered":[118],"improve":[119],"progressively":[120],"starting":[123],"novice,":[126],"learns":[128],"become":[130],"expert":[132],"through":[135],"episodes":[137],"playing.":[140],"Compared":[141],"traditional":[143],"construction":[145],"by":[146],"mathematical":[147,160],"tools,":[148],"particularly":[151],"suitable":[152],"for":[153],"problems":[154],"complex":[156],"objectives":[157],"intractable":[158],"analysis.":[161],"We":[162],"demonstrate":[163],"searching":[165],"capabilities":[166],"two":[170],"applications:":[171],"1)":[172],"successfully":[174],"rediscovers":[175],"ideal":[179],"complementary":[180],"codes":[181],"that":[182,201],"can":[183],"zero-force":[184],"all":[185],"potential":[186],"interferences":[187],"multi-carrier":[189],"code-division":[190],"multiple":[191],"access":[192],"(CDMA)":[193],"systems":[194],"2)":[196],"discovers":[198],"triple":[202],"signal-to-interference":[204],"ratio-benchmarked":[205],"against":[206],"well-known":[208],"Legendre":[209],"sequence-of":[210],"mismatched":[212],"filter":[213],"(MMF)":[214],"estimator":[215],"pulse":[217],"compression":[218],"radar":[219]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
