{"id":"https://openalex.org/W4224139126","doi":"https://doi.org/10.1109/ciss53076.2022.9751163","title":"Policy Gradient for Ratio Optimization: A Case Study","display_name":"Policy Gradient for Ratio Optimization: A Case Study","publication_year":2022,"publication_date":"2022-03-09","ids":{"openalex":"https://openalex.org/W4224139126","doi":"https://doi.org/10.1109/ciss53076.2022.9751163"},"language":"en","primary_location":{"id":"doi:10.1109/ciss53076.2022.9751163","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ciss53076.2022.9751163","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 56th Annual Conference on Information Sciences and Systems (CISS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056599663","display_name":"Wesley A. Suttle","orcid":"https://orcid.org/0000-0003-1234-7151"},"institutions":[{"id":"https://openalex.org/I4210131439","display_name":"Applied Mathematics (United States)","ror":"https://ror.org/03seew607","country_code":"US","type":"company","lineage":["https://openalex.org/I4210131439"]},{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wesley A. Suttle","raw_affiliation_strings":["Stony Brook University,Applied Mathematics and Statistics","Applied Mathematics and Statistics, Stony Brook University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stony Brook University,Applied Mathematics and Statistics","institution_ids":["https://openalex.org/I59553526"]},{"raw_affiliation_string":"Applied Mathematics and Statistics, Stony Brook University","institution_ids":["https://openalex.org/I59553526","https://openalex.org/I4210131439"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025896653","display_name":"Alec Koppel","orcid":"https://orcid.org/0000-0003-2447-2873"},"institutions":[{"id":"https://openalex.org/I4210089985","display_name":"Amazon (Germany)","ror":"https://ror.org/00b9ktm87","country_code":"DE","type":"company","lineage":["https://openalex.org/I1311688040","https://openalex.org/I4210089985"]},{"id":"https://openalex.org/I4210164786","display_name":"Optimal Solutions (United States)","ror":"https://ror.org/05t1cnz26","country_code":"US","type":"company","lineage":["https://openalex.org/I4210164786"]}],"countries":["DE","US"],"is_corresponding":false,"raw_author_name":"Alec Koppel","raw_affiliation_strings":["Supply Chain Optimization Technologies, Amazon,Optimal Sourcing Systems","Optimal Sourcing Systems, Supply Chain Optimization Technologies, Amazon"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Supply Chain Optimization Technologies, Amazon,Optimal Sourcing Systems","institution_ids":["https://openalex.org/I4210164786"]},{"raw_affiliation_string":"Optimal Sourcing Systems, Supply Chain Optimization Technologies, Amazon","institution_ids":["https://openalex.org/I4210164786","https://openalex.org/I4210089985"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100396338","display_name":"Ji Liu","orcid":"https://orcid.org/0000-0003-2871-9888"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ji Liu","raw_affiliation_strings":["Stony Brook University,Electrical and Computer Engineering","Electrical and Computer Engineering, Stony Brook University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stony Brook University,Electrical and Computer Engineering","institution_ids":["https://openalex.org/I59553526"]},{"raw_affiliation_string":"Electrical and Computer Engineering, Stony Brook University","institution_ids":["https://openalex.org/I59553526"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03150867,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"7","issue":null,"first_page":"281","last_page":"286"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11413","display_name":"Risk and Portfolio Optimization","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/omega","display_name":"Omega","score":0.5660735964775085},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5616914629936218},{"id":"https://openalex.org/keywords/optimization-problem","display_name":"Optimization problem","score":0.5180149674415588},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5061408877372742},{"id":"https://openalex.org/keywords/portfolio-optimization","display_name":"Portfolio optimization","score":0.4857640564441681},{"id":"https://openalex.org/keywords/portfolio","display_name":"Portfolio","score":0.47434794902801514},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.33579951524734497},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.12037032842636108},{"id":"https://openalex.org/keywords/finance","display_name":"Finance","score":0.11543712019920349}],"concepts":[{"id":"https://openalex.org/C2779557605","wikidata":"https://www.wikidata.org/wiki/Q9890","display_name":"Omega","level":2,"score":0.5660735964775085},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5616914629936218},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.5180149674415588},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5061408877372742},{"id":"https://openalex.org/C202655437","wikidata":"https://www.wikidata.org/wiki/Q7231728","display_name":"Portfolio optimization","level":3,"score":0.4857640564441681},{"id":"https://openalex.org/C2780821815","wikidata":"https://www.wikidata.org/wiki/Q5340806","display_name":"Portfolio","level":2,"score":0.47434794902801514},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33579951524734497},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.12037032842636108},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.11543712019920349},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ciss53076.2022.9751163","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ciss53076.2022.9751163","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 56th Annual Conference on Information Sciences and Systems (CISS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.8199999928474426,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G6430636516","display_name":null,"funder_award_id":"W911NF-22-2-0003","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"}],"funders":[{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W594357522","https://openalex.org/W1496778712","https://openalex.org/W1499021337","https://openalex.org/W1968115484","https://openalex.org/W2047364871","https://openalex.org/W2094387729","https://openalex.org/W2118208297","https://openalex.org/W2148654185","https://openalex.org/W2155027007","https://openalex.org/W2155054353","https://openalex.org/W2156737235","https://openalex.org/W2169015875","https://openalex.org/W2605411941","https://openalex.org/W3038006656","https://openalex.org/W3038915804","https://openalex.org/W3121933628","https://openalex.org/W3132054471","https://openalex.org/W3172979527","https://openalex.org/W3183820536","https://openalex.org/W4241229021","https://openalex.org/W4241584625","https://openalex.org/W4298023569","https://openalex.org/W4318718437","https://openalex.org/W6629699597","https://openalex.org/W6683040585","https://openalex.org/W6683204974","https://openalex.org/W6702431756","https://openalex.org/W6740961973","https://openalex.org/W6769467134","https://openalex.org/W6780089238","https://openalex.org/W6780386840","https://openalex.org/W6791168167","https://openalex.org/W6796847927","https://openalex.org/W6807091881"],"related_works":["https://openalex.org/W1986311305","https://openalex.org/W4360613713","https://openalex.org/W3125148470","https://openalex.org/W2768197547","https://openalex.org/W2055959038","https://openalex.org/W4206877017","https://openalex.org/W4225528185","https://openalex.org/W4327779378","https://openalex.org/W2795635811","https://openalex.org/W2221832056"],"abstract_inverted_index":{"We":[0,24],"consider":[1],"policy":[2],"gradient":[3],"methods":[4],"for":[5,29,50],"ratio":[6,19,30,53],"optimization":[7,31],"problems":[8],"by":[9],"way":[10],"of":[11,20,39],"an":[12,47],"illustrative":[13],"case":[14],"study:":[15],"maximizing":[16],"the":[17,37,51,62],"Omega":[18,52],"a":[21,26,71],"financial":[22],"portfolio.":[23],"propose":[25,46],"general":[27],"framework":[28],"in":[32,42,79],"sequential":[33],"decision-making":[34],"problems,":[35,44],"explore":[36],"notion":[38],"hidden":[40],"quasiconcavity":[41],"such":[43],"and":[45,74],"actor-critic":[48],"algorithm":[49,63],"problem.":[54],"Our":[55],"central":[56],"contribution":[57],"is":[58],"to":[59,67,75],"show":[60],"that":[61],"converges":[64],"almost":[65],"surely":[66],"(a":[68],"neighborhood":[69],"of)":[70],"global":[72],"optimum":[73],"demonstrate":[76],"its":[77],"performance":[78],"practice.":[80]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
