{"id":"https://openalex.org/W3091315598","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207289","title":"Transformer Decoder Based Reinforcement Learning Approach for Conversational Response Generation","display_name":"Transformer Decoder Based Reinforcement Learning Approach for Conversational Response Generation","publication_year":2020,"publication_date":"2020-07-01","ids":{"openalex":"https://openalex.org/W3091315598","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207289","mag":"3091315598"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn48605.2020.9207289","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207289","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028746314","display_name":"Farshid Faal","orcid":"https://orcid.org/0000-0002-2555-3221"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Farshid Faal","raw_affiliation_strings":["Concordia Institute for Information System Engineering Concordia University, Montreal, Canada"],"affiliations":[{"raw_affiliation_string":"Concordia Institute for Information System Engineering Concordia University, Montreal, Canada","institution_ids":["https://openalex.org/I60158472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101868923","display_name":"Jia Yuan Yu","orcid":"https://orcid.org/0000-0002-6674-6150"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Jia Yuan Yu","raw_affiliation_strings":["Concordia Institute for Information System Engineering Concordia University, Montreal, Canada"],"affiliations":[{"raw_affiliation_string":"Concordia Institute for Information System Engineering Concordia University, Montreal, Canada","institution_ids":["https://openalex.org/I60158472"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064330344","display_name":"Ketra Schmitt","orcid":"https://orcid.org/0000-0002-4260-6209"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ketra Schmitt","raw_affiliation_strings":["Concordia Institute for Information System Engineering Concordia University, Montreal, Canada"],"affiliations":[{"raw_affiliation_string":"Concordia Institute for Information System Engineering Concordia University, Montreal, Canada","institution_ids":["https://openalex.org/I60158472"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5028746314"],"corresponding_institution_ids":["https://openalex.org/I60158472"],"apc_list":null,"apc_paid":null,"fwci":0.1373,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.55344331,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"1","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8163928985595703},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.8030129671096802},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.6419369578361511},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5947930812835693},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5116584897041321},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.46724867820739746},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.44843170046806335},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42321449518203735},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41896945238113403},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.1644591987133026},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11911213397979736}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8163928985595703},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.8030129671096802},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.6419369578361511},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5947930812835693},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5116584897041321},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.46724867820739746},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.44843170046806335},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42321449518203735},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41896945238113403},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.1644591987133026},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11911213397979736},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn48605.2020.9207289","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207289","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5799999833106995}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W10957333","https://openalex.org/W77961983","https://openalex.org/W1191599655","https://openalex.org/W1518951372","https://openalex.org/W1753482797","https://openalex.org/W1771410628","https://openalex.org/W1902237438","https://openalex.org/W1905882502","https://openalex.org/W1993378086","https://openalex.org/W2022433169","https://openalex.org/W2064675550","https://openalex.org/W2074818733","https://openalex.org/W2118434577","https://openalex.org/W2119168550","https://openalex.org/W2119567691","https://openalex.org/W2130942839","https://openalex.org/W2137607259","https://openalex.org/W2137871902","https://openalex.org/W2155027007","https://openalex.org/W2157331557","https://openalex.org/W2161466446","https://openalex.org/W2176263492","https://openalex.org/W2395389931","https://openalex.org/W2551884415","https://openalex.org/W2559038528","https://openalex.org/W2579486552","https://openalex.org/W2584185835","https://openalex.org/W2736601468","https://openalex.org/W2810821963","https://openalex.org/W2890969459","https://openalex.org/W2896457183","https://openalex.org/W2950314731","https://openalex.org/W2951883832","https://openalex.org/W2962784628","https://openalex.org/W2962883855","https://openalex.org/W2963084599","https://openalex.org/W2963167310","https://openalex.org/W2963206148","https://openalex.org/W2963248296","https://openalex.org/W2963341956","https://openalex.org/W2963360026","https://openalex.org/W2963403868","https://openalex.org/W2963668753","https://openalex.org/W2963951265","https://openalex.org/W2963963856","https://openalex.org/W2964309167","https://openalex.org/W4236521339","https://openalex.org/W4298023569","https://openalex.org/W4385245566","https://openalex.org/W6600426076","https://openalex.org/W6627932998","https://openalex.org/W6637698695","https://openalex.org/W6638018090","https://openalex.org/W6679436768","https://openalex.org/W6680585821","https://openalex.org/W6683204974","https://openalex.org/W6685322675","https://openalex.org/W6711536258","https://openalex.org/W6730098006","https://openalex.org/W6732350694","https://openalex.org/W6739901393","https://openalex.org/W6741002519","https://openalex.org/W6755007375","https://openalex.org/W6755207826"],"related_works":["https://openalex.org/W4288365749","https://openalex.org/W2936497627","https://openalex.org/W3013624417","https://openalex.org/W4287826556","https://openalex.org/W3098382480","https://openalex.org/W4287598411","https://openalex.org/W3100913109","https://openalex.org/W3198458223","https://openalex.org/W3126642501","https://openalex.org/W2964413124"],"abstract_inverted_index":{"Developing":[0],"a":[1,10,20,105,110,132,137,149],"machine":[2],"that":[3,142],"can":[4],"hold":[5],"an":[6],"engaging":[7],"conversation":[8],"with":[9,36,85],"human":[11,108,111,135,138],"is":[12,131],"one":[13],"of":[14,26,50,95,117,162],"the":[15,24,48,60,70,86,93,115,126,160,163],"main":[16],"challenges":[17],"in":[18,23,53,104,148],"designing":[19],"dialogue":[21,54,101,150,167],"system":[22],"field":[25],"natural":[27],"language":[28],"processing.":[29],"Responses":[30],"generated":[31],"by":[32],"neural":[33],"conversational":[34,74],"models":[35,157,169],"log-likelihood":[37,51],"training":[38,52,69],"methods":[39],"tend":[40],"to":[41,109,136],"lack":[42],"informativeness":[43],"and":[44,57,158,173],"diversity.":[45],"We":[46,90],"address":[47],"limitation":[49],"generation":[55,103,168],"models,":[56],"we":[58,121],"present":[59],"Reinforce":[61],"Transformer":[62,71,87,165],"decoder":[63,72,88],"model,":[64,75],"our":[65,96,118,123,143],"new":[66],"approach":[67],"for":[68,99],"based":[73,166,170],"which":[76,130],"incorporates":[77],"proximal":[78],"policy":[79],"optimization":[80],"techniques":[81],"from":[82],"re-inforcement":[83],"learning":[84],"architecture.":[89],"specifically":[91],"examine":[92],"use":[94],"proposed":[97,119,144],"model":[98,124,147],"multi-turn":[100],"response":[102,145],"real":[106,133],"word":[107,134],"dataset.":[112,139],"To":[113],"verify":[114],"effectiveness":[116],"framework,":[120],"evaluate":[122],"on":[125,171],"Reddit":[127],"dialogues":[128],"data,":[129],"Experiments":[140],"show":[141],"generating":[146],"achieves":[151],"significant":[152],"improvement":[153],"over":[154],"recurrent":[155],"sequence-to-sequence":[156],"also":[159],"state":[161],"art":[164],"diversity":[172],"relevance":[174],"evaluation":[175],"metrics.":[176]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
