{"id":"https://openalex.org/W2949164659","doi":"https://doi.org/10.1109/allerton.2019.8919799","title":"Reinforcement Learning for Channel Coding: Learned Bit-Flipping Decoding","display_name":"Reinforcement Learning for Channel Coding: Learned Bit-Flipping Decoding","publication_year":2019,"publication_date":"2019-09-01","ids":{"openalex":"https://openalex.org/W2949164659","doi":"https://doi.org/10.1109/allerton.2019.8919799","mag":"2949164659"},"language":"en","primary_location":{"id":"doi:10.1109/allerton.2019.8919799","is_oa":false,"landing_page_url":"https://doi.org/10.1109/allerton.2019.8919799","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 57th Annual Allerton Conference on Communication, Control, and Computing (Allerton)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1906.04448","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Fabrizio Carpi","orcid":null},"institutions":[{"id":"https://openalex.org/I1327163397","display_name":"State University of New York","ror":"https://ror.org/01q1z8k08","country_code":"US","type":"education","lineage":["https://openalex.org/I1327163397"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fabrizio Carpi","raw_affiliation_strings":["New York University,Department of Electrical and Computer Engineering,Brooklyn, New York,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"New York University,Department of Electrical and Computer Engineering,Brooklyn, New York,USA","institution_ids":["https://openalex.org/I1327163397"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Christian H\u00e4ger","orcid":null},"institutions":[{"id":"https://openalex.org/I66862912","display_name":"Chalmers University of Technology","ror":"https://ror.org/040wg7k59","country_code":"SE","type":"education","lineage":["https://openalex.org/I66862912"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Christian H\u00e4ger","raw_affiliation_strings":["Chalmers University of Technology,Department of Electrical Engineering,Gothenburg,Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Chalmers University of Technology,Department of Electrical Engineering,Gothenburg,Sweden","institution_ids":["https://openalex.org/I66862912"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Marco Martal\u00f2","orcid":null},"institutions":[{"id":"https://openalex.org/I124601658","display_name":"University of Parma","ror":"https://ror.org/02k7wn190","country_code":"IT","type":"education","lineage":["https://openalex.org/I124601658"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Martal\u00f2","raw_affiliation_strings":["Department of Engineering and Architecture, University of Parma,\nParma, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Engineering and Architecture, University of Parma,\nParma, Italy","institution_ids":["https://openalex.org/I124601658"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Riccardo Raheli","orcid":null},"institutions":[{"id":"https://openalex.org/I124601658","display_name":"University of Parma","ror":"https://ror.org/02k7wn190","country_code":"IT","type":"education","lineage":["https://openalex.org/I124601658"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Riccardo Raheli","raw_affiliation_strings":["University of Parma,Department of Engineering and Architecture,Parma,Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Parma,Department of Engineering and Architecture,Parma,Italy","institution_ids":["https://openalex.org/I124601658"]}]},{"author_position":"last","author":{"id":null,"display_name":"Henry D. Pfister","orcid":null},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Henry D. Pfister","raw_affiliation_strings":["Duke University,Department of Electrical and Computer Engineering,Durham,North Carolina,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Duke University,Department of Electrical and Computer Engineering,Durham,North Carolina,USA","institution_ids":["https://openalex.org/I170897317"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.905,"has_fulltext":false,"cited_by_count":39,"citation_normalized_percentile":{"value":0.94120765,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"922","last_page":"929"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11321","display_name":"Error Correcting Code Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11321","display_name":"Error Correcting Code Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12131","display_name":"Wireless Signal Modulation Classification","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10964","display_name":"Wireless Communication Security Techniques","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.8119000196456909},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6323000192642212},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5745000243186951},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.5396000146865845},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.5224999785423279},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.4853000044822693},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4519999921321869},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4302000105381012},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.40799999237060547}],"concepts":[{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.8119000196456909},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6435999870300293},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6323000192642212},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5745000243186951},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.5396000146865845},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.5224999785423279},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5062000155448914},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5033000111579895},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.4853000044822693},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4519999921321869},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4302000105381012},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.40799999237060547},{"id":"https://openalex.org/C169334058","wikidata":"https://www.wikidata.org/wiki/Q353292","display_name":"Additive white Gaussian noise","level":3,"score":0.4018999934196472},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3799000084400177},{"id":"https://openalex.org/C204397858","wikidata":"https://www.wikidata.org/wiki/Q4437907","display_name":"List decoding","level":5,"score":0.37950000166893005},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.36340001225471497},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.34940001368522644},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.3458000123500824},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.3296999931335449},{"id":"https://openalex.org/C193969084","wikidata":"https://www.wikidata.org/wiki/Q7452500","display_name":"Sequential decoding","level":4,"score":0.3151000142097473},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3111000061035156},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.3109000027179718},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C112633086","wikidata":"https://www.wikidata.org/wiki/Q381287","display_name":"White noise","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C63435697","wikidata":"https://www.wikidata.org/wiki/Q864135","display_name":"Binary code","level":3,"score":0.27790001034736633},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.27720001339912415},{"id":"https://openalex.org/C117619785","wikidata":"https://www.wikidata.org/wiki/Q6094414","display_name":"Iterative learning control","level":3,"score":0.27630001306533813},{"id":"https://openalex.org/C4199805","wikidata":"https://www.wikidata.org/wiki/Q2725903","display_name":"Gaussian noise","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.2581999897956848}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/allerton.2019.8919799","is_oa":false,"landing_page_url":"https://doi.org/10.1109/allerton.2019.8919799","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 57th Annual Allerton Conference on Communication, Control, and Computing (Allerton)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1906.04448","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.04448","pdf_url":"https://arxiv.org/pdf/1906.04448","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:iris.unica.it:11584/305486","is_oa":false,"landing_page_url":"https://ieeexplore.ieee.org/document/8919799","pdf_url":null,"source":{"id":"https://openalex.org/S4377196293","display_name":"UNICA IRIS Institutional Research Information System (University of Cagliari)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172446870","host_organization_name":"University of Cagliari","host_organization_lineage":["https://openalex.org/I172446870"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferencePaper"},{"id":"pmh:oai:research.chalmers.se:517439","is_oa":false,"landing_page_url":"https://research.chalmers.se/en/publication/bb4d4fa0-30a1-42c7-b676-81d75abda8bc","pdf_url":null,"source":{"id":"https://openalex.org/S4306402469","display_name":"Chalmers Research (Chalmers University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66862912","host_organization_name":"Chalmers University of Technology","host_organization_lineage":["https://openalex.org/I66862912"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1906.04448","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.04448","pdf_url":"https://arxiv.org/pdf/1906.04448","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1597391834","https://openalex.org/W2021444624","https://openalex.org/W2091121840","https://openalex.org/W2114869758","https://openalex.org/W2121498709","https://openalex.org/W2134502194","https://openalex.org/W2140124864","https://openalex.org/W2144727550","https://openalex.org/W2148076418","https://openalex.org/W2151852374","https://openalex.org/W2156826724","https://openalex.org/W2161084929","https://openalex.org/W2584943905","https://openalex.org/W2734408173","https://openalex.org/W2793196194","https://openalex.org/W2901703166","https://openalex.org/W2963408536","https://openalex.org/W2964070430","https://openalex.org/W2964292940","https://openalex.org/W2976077638","https://openalex.org/W4214717370","https://openalex.org/W4256264271","https://openalex.org/W6631424144","https://openalex.org/W6747916894","https://openalex.org/W6752963931","https://openalex.org/W6755792838"],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,75],"use":[4],"reinforcement":[5],"learning":[6,58,121,127],"to":[7,51,135],"find":[8],"effective":[9],"decoding":[10,22,78,131],"strategies":[11],"for":[12,56,79,104],"binary":[13,82],"linear":[14],"codes.":[15],"We":[16,42,118],"start":[17],"by":[18],"reviewing":[19],"several":[20],"iterative":[21],"algorithms":[23,47],"that":[24,93],"involve":[25],"a":[26,72,99],"decision-making":[27],"process":[28,128],"at":[29],"each":[30],"step,":[31],"including":[32],"bit-flipping":[33],"(BF)":[34],"decoding,":[35],"residual":[36],"belief":[37],"propagation,":[38],"and":[39,84,108,111,141],"anchor":[40],"decoding.":[41],"then":[43],"illustrate":[44],"how":[45],"such":[46],"can":[48,97],"be":[49],"mapped":[50],"Markov":[52],"decision":[53,61],"processes":[54],"allowing":[55],"data-driven":[57],"of":[59,101],"optimal":[60],"strategies,":[62],"rather":[63],"than":[64],"basing":[65],"decisions":[66],"on":[67,138],"heuristics":[68],"or":[69],"intuition.":[70],"As":[71],"case":[73],"study,":[74],"consider":[76],"BF":[77,95],"both":[80],"the":[81,105,126],"symmetric":[83],"additive":[85],"white":[86],"Gaussian":[87],"noise":[88],"channel.":[89],"Our":[90],"results":[91],"show":[92],"learned":[94],"decoders":[96],"offer":[98],"range":[100],"performance-complexity":[102],"trade-offs":[103],"considered":[106],"Reed-Muller":[107],"BCH":[109],"codes,":[110],"achieve":[112],"near-optimal":[113],"performance":[114],"in":[115],"some":[116],"cases.":[117],"also":[119],"demonstrate":[120],"convergence":[122],"speed-ups":[123],"when":[124],"biasing":[125],"towards":[129],"correct":[130],"decisions,":[132],"as":[133],"opposed":[134],"relying":[136],"only":[137],"random":[139],"explorations":[140],"past":[142],"knowledge.":[143]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":6}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2019-06-27T00:00:00"}
