{"id":"https://openalex.org/W2757930439","doi":"https://doi.org/10.18653/v1/w17-4304","title":"Structured Prediction via Learning to Search under Bandit Feedback","display_name":"Structured Prediction via Learning to Search under Bandit Feedback","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2757930439","doi":"https://doi.org/10.18653/v1/w17-4304","mag":"2757930439"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w17-4304","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-4304","pdf_url":"https://www.aclweb.org/anthology/W17-4304.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd Workshop on Structured Prediction for Natural\n          Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/W17-4304.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068614789","display_name":"Amr Sharaf","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Amr Sharaf","raw_affiliation_strings":["University of Maryland, College Park"],"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019928111","display_name":"Hal Daum\u00e9","orcid":"https://orcid.org/0000-0002-3760-345X"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hal Daum\u00e9 III","raw_affiliation_strings":["University of Maryland, College Park"],"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park","institution_ids":["https://openalex.org/I66946132"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5068614789"],"corresponding_institution_ids":["https://openalex.org/I66946132"],"apc_list":null,"apc_paid":null,"fwci":1.8857,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.87171094,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"17","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7061318755149841},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5154274702072144},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4851311147212982}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7061318755149841},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5154274702072144},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4851311147212982}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/w17-4304","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-4304","pdf_url":"https://www.aclweb.org/anthology/W17-4304.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd Workshop on Structured Prediction for Natural\n          Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/w17-4304","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-4304","pdf_url":"https://www.aclweb.org/anthology/W17-4304.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd Workshop on Structured Prediction for Natural\n          Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3020253667","display_name":"RI: Small: Linguistic Semantics and Discourse from Leaky Distant Supervision","funder_award_id":"1618193","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2757930439.pdf","grobid_xml":"https://content.openalex.org/works/W2757930439.grobid-xml"},"referenced_works_count":47,"referenced_works":["https://openalex.org/W81000870","https://openalex.org/W115173043","https://openalex.org/W371426616","https://openalex.org/W648786980","https://openalex.org/W1579652926","https://openalex.org/W1632114991","https://openalex.org/W1846966754","https://openalex.org/W1850531616","https://openalex.org/W1850547517","https://openalex.org/W1931877416","https://openalex.org/W1998498767","https://openalex.org/W2001947543","https://openalex.org/W2004763266","https://openalex.org/W2077902449","https://openalex.org/W2098532383","https://openalex.org/W2103715332","https://openalex.org/W2104805229","https://openalex.org/W2104917081","https://openalex.org/W2108114251","https://openalex.org/W2108738385","https://openalex.org/W2112420033","https://openalex.org/W2116929514","https://openalex.org/W2118980425","https://openalex.org/W2119850747","https://openalex.org/W2147880316","https://openalex.org/W2155027007","https://openalex.org/W2158349948","https://openalex.org/W2166253248","https://openalex.org/W2169401877","https://openalex.org/W2186629860","https://openalex.org/W2257979135","https://openalex.org/W2278024189","https://openalex.org/W2513592723","https://openalex.org/W2541794668","https://openalex.org/W2951270685","https://openalex.org/W2951665052","https://openalex.org/W2953182116","https://openalex.org/W2962957031","https://openalex.org/W2963620441","https://openalex.org/W2964125852","https://openalex.org/W2964245012","https://openalex.org/W3098679278","https://openalex.org/W3124229194","https://openalex.org/W3198214231","https://openalex.org/W4237910115","https://openalex.org/W4297664295","https://openalex.org/W4299286629"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4224009465","https://openalex.org/W4286629047","https://openalex.org/W4306321456","https://openalex.org/W3046775127","https://openalex.org/W4205958290","https://openalex.org/W3107474891","https://openalex.org/W3209574120","https://openalex.org/W3170094116"],"abstract_inverted_index":{"We":[0,33,61,81],"present":[1],"an":[2],"algorithm":[3],"for":[4,27,58,69,76],"structured":[5,21],"prediction":[6],"under":[7],"online":[8],"bandit":[9,39],"feedback.":[10],"The":[11],"learner":[12],"repeatedly":[13],"predicts":[14],"a":[15,20,37,46,56,77,84],"sequence":[16,99],"of":[17,86,96],"actions,":[18],"generating":[19],"output.":[22],"It":[23],"then":[24],"observes":[25,45,55],"feedback":[26,51,66],"that":[28,63],"output":[29],"and":[30,48,89,92,101],"no":[31],"others.":[32],"consider":[34],"two":[35],"cases:":[36],"pure":[38],"setting":[40],"in":[41,52],"which":[42,53],"it":[43,54,74],"only":[44],"loss,":[47],"more":[49],"fine-grained":[50,65],"loss":[57],"every":[59],"action.":[60],"find":[62],"the":[64,94],"is":[67],"necessary":[68],"strong":[70],"empirical":[71],"performance,":[72],"because":[73],"allows":[75],"robust":[78],"variance-reduction":[79],"strategy.":[80],"empirically":[82],"compare":[83],"number":[85],"different":[87],"algorithms":[88],"exploration":[90],"methods":[91],"show":[93],"efficacy":[95],"BLS":[97],"on":[98],"labeling":[100],"dependency":[102],"parsing":[103],"tasks.":[104]},"counts_by_year":[{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
