{"id":"https://openalex.org/W2526182867","doi":"https://doi.org/10.18653/v1/d16-1245","title":"Deep Reinforcement Learning for Mention-Ranking Coreference Models","display_name":"Deep Reinforcement Learning for Mention-Ranking Coreference Models","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W2526182867","doi":"https://doi.org/10.18653/v1/d16-1245","mag":"2526182867"},"language":"en","primary_location":{"id":"doi:10.18653/v1/d16-1245","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d16-1245","pdf_url":"https://www.aclweb.org/anthology/D16-1245.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2016 Conference on Empirical Methods in Natural\n          Language Processing","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/D16-1245.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049064405","display_name":"Kevin B. Clark","orcid":"https://orcid.org/0000-0003-0544-2150"},"institutions":[{"id":"https://openalex.org/I4210156583","display_name":"Laboratoire d'Informatique de Paris-Nord","ror":"https://ror.org/05g1zjw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210091279","https://openalex.org/I4210156583","https://openalex.org/I4210159245"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["FR","US"],"is_corresponding":true,"raw_author_name":"Kevin Clark","raw_affiliation_strings":["Computer Science Department Stanford University","Stanford University, Stanford, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science Department Stanford University","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford University, Stanford, United States","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046006076","display_name":"Christopher D. Manning","orcid":"https://orcid.org/0000-0001-6155-649X"},"institutions":[{"id":"https://openalex.org/I4210156583","display_name":"Laboratoire d'Informatique de Paris-Nord","ror":"https://ror.org/05g1zjw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210091279","https://openalex.org/I4210156583","https://openalex.org/I4210159245"]},{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["FR","US"],"is_corresponding":false,"raw_author_name":"Christopher D. Manning","raw_affiliation_strings":["Computer Science Department Stanford University","Stanford University, Stanford, United States"],"affiliations":[{"raw_affiliation_string":"Computer Science Department Stanford University","institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford University, Stanford, United States","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5049064405"],"corresponding_institution_ids":["https://openalex.org/I4210156583","https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":7.985,"has_fulltext":true,"cited_by_count":44,"citation_normalized_percentile":{"value":0.97469256,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2256","last_page":"2262"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coreference","display_name":"Coreference","score":0.9560286998748779},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8671972751617432},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8077426552772522},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.8025993704795837},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.7532421350479126},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6927422285079956},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6300289630889893},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.6237583160400391},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5502984523773193},{"id":"https://openalex.org/keywords/resolution","display_name":"Resolution (logic)","score":0.469551146030426},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4487605392932892}],"concepts":[{"id":"https://openalex.org/C28076734","wikidata":"https://www.wikidata.org/wiki/Q63087","display_name":"Coreference","level":3,"score":0.9560286998748779},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8671972751617432},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8077426552772522},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.8025993704795837},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.7532421350479126},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6927422285079956},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6300289630889893},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.6237583160400391},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5502984523773193},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.469551146030426},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4487605392932892},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.18653/v1/d16-1245","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d16-1245","pdf_url":"https://www.aclweb.org/anthology/D16-1245.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2016 Conference on Empirical Methods in Natural\n          Language Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1609.08667","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1609.08667","pdf_url":"https://arxiv.org/pdf/1609.08667","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"mag:2526182867","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1609.08667.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1609.08667","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1609.08667","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.18653/v1/d16-1245","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d16-1245","pdf_url":"https://www.aclweb.org/anthology/D16-1245.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2016 Conference on Empirical Methods in Natural\n          Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.5600000023841858,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G5651234186","display_name":"RI: Medium: Deep Understanding: Integrating Neural and Symbolic Models of Meaning","funder_award_id":"1514268","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8295239305","display_name":null,"funder_award_id":"514268","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2526182867.pdf","grobid_xml":"https://content.openalex.org/works/W2526182867.grobid-xml"},"referenced_works_count":19,"referenced_works":["https://openalex.org/W65330238","https://openalex.org/W1495981708","https://openalex.org/W1904365287","https://openalex.org/W1965693266","https://openalex.org/W2098345921","https://openalex.org/W2112648537","https://openalex.org/W2119717200","https://openalex.org/W2124700572","https://openalex.org/W2155069789","https://openalex.org/W2167140078","https://openalex.org/W2180160918","https://openalex.org/W2251035762","https://openalex.org/W2251064706","https://openalex.org/W2252031764","https://openalex.org/W2252247041","https://openalex.org/W2312609093","https://openalex.org/W2336260055","https://openalex.org/W2410503294","https://openalex.org/W2949600092"],"related_works":["https://openalex.org/W2963167649","https://openalex.org/W2964308564","https://openalex.org/W2250539671","https://openalex.org/W2064675550","https://openalex.org/W2738152205","https://openalex.org/W3162119881","https://openalex.org/W2952420254","https://openalex.org/W2410503294","https://openalex.org/W2135734357","https://openalex.org/W150227128","https://openalex.org/W2963403868","https://openalex.org/W2963341956","https://openalex.org/W2787560479","https://openalex.org/W2410983263","https://openalex.org/W2155069789","https://openalex.org/W2101105183","https://openalex.org/W2161771536","https://openalex.org/W236383343","https://openalex.org/W2252247041","https://openalex.org/W2950055289"],"abstract_inverted_index":{"Coreference":[0],"resolution":[1],"systems":[2],"are":[3],"typically":[4],"trained":[5],"with":[6,35],"heuristic":[7],"loss":[8],"functions":[9],"that":[10],"require":[11],"careful":[12],"tuning.":[13],"In":[14],"this":[15],"paper":[16],"we":[17],"instead":[18],"apply":[19],"reinforcement":[20],"learning":[21],"to":[22,52],"directly":[23],"optimize":[24],"a":[25,44,58],"neural":[26],"mention-ranking":[27],"model":[28],"for":[29],"coreference":[30],"evaluation":[31],"metrics.":[32],"We":[33,48],"experiment":[34],"two":[36],"approaches:":[37],"the":[38,50,62,66,72],"REINFORCE":[39],"policy":[40],"gradient":[41],"algorithm":[42],"and":[43,68],"rewardrescaled":[45],"max-margin":[46],"objective.":[47],"find":[49],"latter":[51],"be":[53],"more":[54],"effective,":[55],"resulting":[56],"in":[57],"significant":[59],"improvement":[60],"over":[61],"current":[63],"stateof-the-art":[64],"on":[65],"English":[67],"Chinese":[69],"portions":[70],"of":[71],"CoNLL":[73],"2012":[74],"Shared":[75],"Task.":[76]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":2}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
