{"id":"https://openalex.org/W2962953307","doi":"https://doi.org/10.18653/v1/d18-1421","title":"Paraphrase Generation with Deep Reinforcement Learning","display_name":"Paraphrase Generation with Deep Reinforcement Learning","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2962953307","doi":"https://doi.org/10.18653/v1/d18-1421","mag":"2962953307"},"language":"en","primary_location":{"id":"doi:10.18653/v1/d18-1421","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d18-1421","pdf_url":"https://www.aclweb.org/anthology/D18-1421.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/D18-1421.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009277091","display_name":"Zichao Li","orcid":"https://orcid.org/0000-0003-2582-3006"},"institutions":[{"id":"https://openalex.org/I4210159102","display_name":"Huawei Technologies (Sweden)","ror":"https://ror.org/0500fyd17","country_code":"SE","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210159102"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Zichao Li","raw_affiliation_strings":["Noah's Ark Lab, Huawei Technologies"],"affiliations":[{"raw_affiliation_string":"Noah's Ark Lab, Huawei Technologies","institution_ids":["https://openalex.org/I4210159102"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086603207","display_name":"Xin Jiang","orcid":"https://orcid.org/0000-0002-9117-8247"},"institutions":[{"id":"https://openalex.org/I4210159102","display_name":"Huawei Technologies (Sweden)","ror":"https://ror.org/0500fyd17","country_code":"SE","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210159102"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Xin Jiang","raw_affiliation_strings":["Noah's Ark Lab, Huawei Technologies"],"affiliations":[{"raw_affiliation_string":"Noah's Ark Lab, Huawei Technologies","institution_ids":["https://openalex.org/I4210159102"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046228314","display_name":"Lifeng Shang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210159102","display_name":"Huawei Technologies (Sweden)","ror":"https://ror.org/0500fyd17","country_code":"SE","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210159102"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Lifeng Shang","raw_affiliation_strings":["Noah's Ark Lab, Huawei Technologies"],"affiliations":[{"raw_affiliation_string":"Noah's Ark Lab, Huawei Technologies","institution_ids":["https://openalex.org/I4210159102"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100455112","display_name":"Hang Li","orcid":"https://orcid.org/0000-0001-5096-0155"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hang Li","raw_affiliation_strings":["Toutiao AI Lab"],"affiliations":[{"raw_affiliation_string":"Toutiao AI Lab","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5009277091"],"corresponding_institution_ids":["https://openalex.org/I4210159102"],"apc_list":null,"apc_paid":null,"fwci":23.355,"has_fulltext":true,"cited_by_count":189,"citation_normalized_percentile":{"value":0.99494472,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3865","last_page":"3878"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/paraphrase","display_name":"Paraphrase","score":0.9304301738739014},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8441303968429565},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.8046451210975647},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7578790783882141},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6443647146224976},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6199944615364075},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.6191101670265198},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5928505063056946},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.538199245929718},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5329227447509766},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.42874041199684143},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3867042064666748},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.09795805811882019}],"concepts":[{"id":"https://openalex.org/C2780922921","wikidata":"https://www.wikidata.org/wiki/Q255189","display_name":"Paraphrase","level":2,"score":0.9304301738739014},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8441303968429565},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.8046451210975647},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7578790783882141},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6443647146224976},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6199944615364075},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.6191101670265198},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5928505063056946},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.538199245929718},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5329227447509766},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.42874041199684143},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3867042064666748},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.09795805811882019},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/d18-1421","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d18-1421","pdf_url":"https://www.aclweb.org/anthology/D18-1421.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/d18-1421","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d18-1421","pdf_url":"https://www.aclweb.org/anthology/D18-1421.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8100000023841858}],"awards":[{"id":"https://openalex.org/G4304641529","display_name":null,"funder_award_id":"2014CB340301","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5171771356","display_name":null,"funder_award_id":"2014CB","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2962953307.pdf","grobid_xml":"https://content.openalex.org/works/W2962953307.grobid-xml"},"referenced_works_count":73,"referenced_works":["https://openalex.org/W174630521","https://openalex.org/W648786980","https://openalex.org/W1505629914","https://openalex.org/W1522301498","https://openalex.org/W1591706642","https://openalex.org/W1776056560","https://openalex.org/W1777239053","https://openalex.org/W1843891098","https://openalex.org/W1999874108","https://openalex.org/W2098774185","https://openalex.org/W2099471712","https://openalex.org/W2101105183","https://openalex.org/W2103081392","https://openalex.org/W2103305545","https://openalex.org/W2119717200","https://openalex.org/W2119785746","https://openalex.org/W2127564752","https://openalex.org/W2130942839","https://openalex.org/W2132019450","https://openalex.org/W2133512280","https://openalex.org/W2133564696","https://openalex.org/W2146502635","https://openalex.org/W2154652894","https://openalex.org/W2155027007","https://openalex.org/W2157331557","https://openalex.org/W2167170026","https://openalex.org/W2169498096","https://openalex.org/W2170738476","https://openalex.org/W2176263492","https://openalex.org/W2290104316","https://openalex.org/W2296073425","https://openalex.org/W2413794162","https://openalex.org/W2525778437","https://openalex.org/W2531908596","https://openalex.org/W2557480356","https://openalex.org/W2566467060","https://openalex.org/W2581637843","https://openalex.org/W2605243085","https://openalex.org/W2606974598","https://openalex.org/W2616969219","https://openalex.org/W2617128460","https://openalex.org/W2741049976","https://openalex.org/W2755124548","https://openalex.org/W2793501144","https://openalex.org/W2950635152","https://openalex.org/W2951359136","https://openalex.org/W2951824008","https://openalex.org/W2962965405","https://openalex.org/W2963001247","https://openalex.org/W2963014947","https://openalex.org/W2963033554","https://openalex.org/W2963126845","https://openalex.org/W2963248296","https://openalex.org/W2963248348","https://openalex.org/W2963277051","https://openalex.org/W2963343509","https://openalex.org/W2963403868","https://openalex.org/W2963463583","https://openalex.org/W2963508788","https://openalex.org/W2963546833","https://openalex.org/W2963558220","https://openalex.org/W2963590100","https://openalex.org/W2963847417","https://openalex.org/W2963941871","https://openalex.org/W2963963856","https://openalex.org/W2964053384","https://openalex.org/W2964121744","https://openalex.org/W2964212550","https://openalex.org/W2964268978","https://openalex.org/W2964308564","https://openalex.org/W2964352247","https://openalex.org/W4320013936","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W1973985309","https://openalex.org/W2263401911","https://openalex.org/W350308244","https://openalex.org/W2978707643","https://openalex.org/W2087536156","https://openalex.org/W2398825887","https://openalex.org/W2793324584","https://openalex.org/W4385718007","https://openalex.org/W2962934171","https://openalex.org/W2148689572"],"abstract_inverted_index":{"Automatic":[0],"generation":[1,162],"of":[2,43,50,85,115,135],"paraphrases":[3,66,84,154],"from":[4,54],"a":[5,24,35,44,60,68,74],"given":[6,67,108],"sentence":[7],"is":[8,90,107],"an":[9,47],"important":[10],"yet":[11],"challenging":[12],"task":[13],"in":[14,103,160,163],"natural":[15],"language":[16],"processing":[17],"(NLP).":[18],"In":[19],"this":[20],"paper,":[21],"we":[22,33,118],"present":[23],"deep":[25,75,94],"reinforcement":[26,101,128],"learning":[27,62,95,102,114,125,129],"approach":[28],"to":[29],"paraphrase":[30,161],"generation.":[31],"Specifically,":[32],"propose":[34,119],"new":[36],"framework":[37],"for":[38],"the":[39,105,110,113,116,133,145,157],"task,":[40],"which":[41,51,104],"consists":[42],"generator":[45,89],"and":[46,96,126,155,167],"evaluator,":[48,71,117],"both":[49,164],"are":[52,83],"learned":[53],"data.":[55,138],"The":[56,70,88],"generator,":[57],"built":[58],"as":[59,73],"sequenceto-sequence":[61],"model,":[63,77],"can":[64,78,150],"produce":[65,151],"sentence.":[69],"constructed":[72],"matching":[76],"judge":[79],"whether":[80],"two":[81,120,142],"sentences":[82],"each":[86],"other.":[87],"first":[91],"trained":[92],"by":[93,100,109],"then":[97],"further":[98],"fine-tuned":[99],"reward":[106],"evaluator.":[111],"For":[112],"methods":[121,159],"based":[122],"on":[123,132,141],"supervised":[124],"inverse":[127],"respectively,":[130],"depending":[131],"type":[134],"available":[136],"training":[137],"Experimental":[139],"results":[140],"datasets":[143],"demonstrate":[144],"proposed":[146],"models":[147],"(the":[148],"generators)":[149],"more":[152],"accurate":[153],"outperform":[156],"stateof-the-art":[158],"automatic":[165],"evaluation":[166],"human":[168],"evaluation.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":21},{"year":2021,"cited_by_count":40},{"year":2020,"cited_by_count":50},{"year":2019,"cited_by_count":38},{"year":2018,"cited_by_count":10}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
