{"id":"https://openalex.org/W3157066907","doi":"https://doi.org/10.1609/aaai.v35i6.16659","title":"Reinforcement Learning of Sequential Price Mechanisms","display_name":"Reinforcement Learning of Sequential Price Mechanisms","publication_year":2021,"publication_date":"2021-05-18","ids":{"openalex":"https://openalex.org/W3157066907","doi":"https://doi.org/10.1609/aaai.v35i6.16659","mag":"3157066907"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v35i6.16659","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v35i6.16659","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16659/16466","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16659/16466","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007934589","display_name":"Gianluca Brero","orcid":null},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Gianluca Brero","raw_affiliation_strings":["Harvard University"],"affiliations":[{"raw_affiliation_string":"Harvard University","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052790204","display_name":"Alon Eden","orcid":"https://orcid.org/0000-0002-0907-3914"},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alon Eden","raw_affiliation_strings":["Harvard University"],"affiliations":[{"raw_affiliation_string":"Harvard University","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062440568","display_name":"Matthias Gerstgrasser","orcid":null},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Matthias Gerstgrasser","raw_affiliation_strings":["Harvard University"],"affiliations":[{"raw_affiliation_string":"Harvard University","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068264437","display_name":"David Parkes","orcid":null},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Parkes","raw_affiliation_strings":["Harvard University"],"affiliations":[{"raw_affiliation_string":"Harvard University","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037396817","display_name":"Duncan Rheingans-Yoo","orcid":null},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Duncan Rheingans-Yoo","raw_affiliation_strings":["Harvard University"],"affiliations":[{"raw_affiliation_string":"Harvard University","institution_ids":["https://openalex.org/I2801851002"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5007934589"],"corresponding_institution_ids":["https://openalex.org/I2801851002"],"apc_list":null,"apc_paid":null,"fwci":1.5357,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.81507824,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"35","issue":"6","first_page":"5219","last_page":"5227"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10646","display_name":"Experimental Behavioral Economics Studies","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8508251905441284},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.6789095401763916},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6481090784072876},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6286514401435852},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.5964611172676086},{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.5234346389770508},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.47993046045303345},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47082382440567017},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4676351845264435},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4618707001209259},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.44648033380508423},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.39568135142326355},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.34017130732536316},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.29725995659828186},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.21344250440597534},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.18539205193519592},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.11642026901245117},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.07616326212882996},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.06756499409675598}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8508251905441284},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.6789095401763916},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6481090784072876},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6286514401435852},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.5964611172676086},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.5234346389770508},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.47993046045303345},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47082382440567017},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4676351845264435},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4618707001209259},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.44648033380508423},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.39568135142326355},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.34017130732536316},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29725995659828186},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.21344250440597534},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.18539205193519592},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.11642026901245117},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.07616326212882996},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.06756499409675598},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v35i6.16659","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v35i6.16659","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16659/16466","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v35i6.16659","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v35i6.16659","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16659/16466","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.8199999928474426,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G1093674026","display_name":null,"funder_award_id":"agreement","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G4621158401","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G602257814","display_name":"Towards a General Theory of Mechanism Design for Economies of Automated Agents","funder_award_id":"191253","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G6801848600","display_name":"Akte der Rechtsetzung im Bereiche der schweizeri- schen Aussenpolitik.","funder_award_id":"20029","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320320924","display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung","ror":"https://ror.org/00yjd3n13"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320332815","display_name":"Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3157066907.pdf","grobid_xml":"https://content.openalex.org/works/W3157066907.grobid-xml"},"referenced_works_count":79,"referenced_works":["https://openalex.org/W102212266","https://openalex.org/W1507134461","https://openalex.org/W1582122708","https://openalex.org/W1826494558","https://openalex.org/W1846856248","https://openalex.org/W1942817867","https://openalex.org/W1984726588","https://openalex.org/W1985367963","https://openalex.org/W1989148223","https://openalex.org/W2008737310","https://openalex.org/W2012672170","https://openalex.org/W2038017315","https://openalex.org/W2064675550","https://openalex.org/W2076337359","https://openalex.org/W2078587062","https://openalex.org/W2082943428","https://openalex.org/W2100292679","https://openalex.org/W2102399453","https://openalex.org/W2108682071","https://openalex.org/W2116009284","https://openalex.org/W2122124037","https://openalex.org/W2126528747","https://openalex.org/W2130521818","https://openalex.org/W2164143329","https://openalex.org/W2168069490","https://openalex.org/W2168359464","https://openalex.org/W2260756217","https://openalex.org/W2567363598","https://openalex.org/W2573152691","https://openalex.org/W2623431351","https://openalex.org/W2734590272","https://openalex.org/W2736601468","https://openalex.org/W2740489910","https://openalex.org/W2749928749","https://openalex.org/W2771017837","https://openalex.org/W2808146197","https://openalex.org/W2808749078","https://openalex.org/W2888571344","https://openalex.org/W2892074363","https://openalex.org/W2950290776","https://openalex.org/W2950351404","https://openalex.org/W2963184638","https://openalex.org/W2963313316","https://openalex.org/W2963426715","https://openalex.org/W2963440040","https://openalex.org/W2964043796","https://openalex.org/W2965084085","https://openalex.org/W2980094399","https://openalex.org/W2990760025","https://openalex.org/W2998596932","https://openalex.org/W3008809765","https://openalex.org/W3023007900","https://openalex.org/W3023615263","https://openalex.org/W3041225824","https://openalex.org/W3091257192","https://openalex.org/W3123500228","https://openalex.org/W3124026469","https://openalex.org/W3186341834","https://openalex.org/W4229497432","https://openalex.org/W4243139241","https://openalex.org/W4297872963","https://openalex.org/W4299802797","https://openalex.org/W4385366197","https://openalex.org/W6604092932","https://openalex.org/W6627198108","https://openalex.org/W6633577978","https://openalex.org/W6638626249","https://openalex.org/W6638735515","https://openalex.org/W6640749565","https://openalex.org/W6653474156","https://openalex.org/W6666761814","https://openalex.org/W6669402789","https://openalex.org/W6670379539","https://openalex.org/W6684099973","https://openalex.org/W6741922412","https://openalex.org/W6743013956","https://openalex.org/W6769439163","https://openalex.org/W6789028906","https://openalex.org/W6799106678"],"related_works":["https://openalex.org/W2096013579","https://openalex.org/W1589140671","https://openalex.org/W1760611253","https://openalex.org/W52153049","https://openalex.org/W3096874164","https://openalex.org/W2951545791","https://openalex.org/W1515117609","https://openalex.org/W2294884454","https://openalex.org/W2937181779","https://openalex.org/W2386410636"],"abstract_inverted_index":{"We":[0,49,83],"introduce":[1],"the":[2,12,77],"use":[3],"of":[4,15,57,70,79],"reinforcement":[5],"learning":[6],"for":[7,53,66,73,76],"indirect":[8],"mechanisms,":[9,18,65],"working":[10],"with":[11],"existing":[13],"class":[14,42,56],"sequential":[16],"price":[17,26],"which":[19],"generalizes":[20],"both":[21],"serial":[22],"dictatorship":[23],"and":[24,28,75],"posted":[25],"mechanisms":[27,58,93],"essentially":[29],"characterizes":[30],"all":[31],"strongly":[32],"obviously":[33],"strategyproof":[34],"mechanisms.":[35],"Learning":[36],"an":[37],"optimal":[38,90],"mechanism":[39],"within":[40],"this":[41,55],"forms":[43],"a":[44],"partially-observable":[45],"Markov":[46],"decision":[47],"process.":[48],"provide":[50],"rigorous":[51],"conditions":[52],"when":[54],"is":[59],"more":[60],"powerful":[61],"than":[62],"simpler":[63],"static":[64],"sufficiency":[67],"or":[68,91],"insufficiency":[69],"observation":[71],"statistics":[72],"learning,":[74],"necessity":[78],"complex":[80],"(deep)":[81],"policies.":[82],"show":[84],"that":[85],"our":[86],"approach":[87],"can":[88],"learn":[89],"near-optimal":[92],"in":[94],"several":[95],"experimental":[96],"settings.":[97]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
