{"id":"https://openalex.org/W3099082736","doi":"https://doi.org/10.1109/access.2020.3037940","title":"A Dynamic Bidding Strategy Based on Model-Free Reinforcement Learning in Display Advertising","display_name":"A Dynamic Bidding Strategy Based on Model-Free Reinforcement Learning in Display Advertising","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3099082736","doi":"https://doi.org/10.1109/access.2020.3037940","mag":"3099082736"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3037940","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3037940","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2020.3037940","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005041726","display_name":"Mengjuan Liu","orcid":"https://orcid.org/0000-0003-3679-7915"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mengjuan Liu","raw_affiliation_strings":["Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","ORCiD"],"raw_orcid":"https://orcid.org/0000-0003-3679-7915","affiliations":[{"raw_affiliation_string":"Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"ORCiD","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020895300","display_name":"Li Jiaxing","orcid":"https://orcid.org/0000-0002-3074-5383"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Jiaxing","raw_affiliation_strings":["Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","ORCiD"],"raw_orcid":"https://orcid.org/0000-0002-3074-5383","affiliations":[{"raw_affiliation_string":"Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"ORCiD","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103068652","display_name":"Zhengning Hu","orcid":"https://orcid.org/0000-0002-1354-2197"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengning Hu","raw_affiliation_strings":["Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","ORCiD"],"raw_orcid":"https://orcid.org/0000-0002-1354-2197","affiliations":[{"raw_affiliation_string":"Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"ORCiD","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100329170","display_name":"Jinyu Liu","orcid":"https://orcid.org/0000-0001-5428-625X"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinyu Liu","raw_affiliation_strings":["Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","ORCiD"],"raw_orcid":"https://orcid.org/0000-0001-5428-625X","affiliations":[{"raw_affiliation_string":"Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"ORCiD","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016371039","display_name":"Xuyun Nie","orcid":"https://orcid.org/0000-0003-2868-0442"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuyun Nie","raw_affiliation_strings":["Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","ORCiD"],"raw_orcid":"https://orcid.org/0000-0003-2868-0442","affiliations":[{"raw_affiliation_string":"Network and Data Security Key Laboratory of Sichuan Province, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"ORCiD","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5005041726"],"corresponding_institution_ids":["https://openalex.org/I150229711"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":2.0691,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":{"value":0.88736734,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"8","issue":null,"first_page":"213587","last_page":"213601"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bidding","display_name":"Bidding","score":0.9664058685302734},{"id":"https://openalex.org/keywords/real-time-bidding","display_name":"Real-time bidding","score":0.8500567674636841},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.805722713470459},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6844944953918457},{"id":"https://openalex.org/keywords/ebidding","display_name":"Ebidding","score":0.6681879162788391},{"id":"https://openalex.org/keywords/display-advertising","display_name":"Display advertising","score":0.5494592785835266},{"id":"https://openalex.org/keywords/revenue","display_name":"Revenue","score":0.5177571177482605},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.36035871505737305},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.32999324798583984},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.3294237554073334},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2512710690498352},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.20189496874809265},{"id":"https://openalex.org/keywords/online-advertising","display_name":"Online advertising","score":0.19580590724945068},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10712701082229614},{"id":"https://openalex.org/keywords/finance","display_name":"Finance","score":0.09047698974609375},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07925572991371155}],"concepts":[{"id":"https://openalex.org/C9233905","wikidata":"https://www.wikidata.org/wiki/Q3276328","display_name":"Bidding","level":2,"score":0.9664058685302734},{"id":"https://openalex.org/C1525070","wikidata":"https://www.wikidata.org/wiki/Q2134714","display_name":"Real-time bidding","level":3,"score":0.8500567674636841},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.805722713470459},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6844944953918457},{"id":"https://openalex.org/C143989560","wikidata":"https://www.wikidata.org/wiki/Q17011617","display_name":"Ebidding","level":3,"score":0.6681879162788391},{"id":"https://openalex.org/C2777999536","wikidata":"https://www.wikidata.org/wiki/Q2399498","display_name":"Display advertising","level":4,"score":0.5494592785835266},{"id":"https://openalex.org/C195487862","wikidata":"https://www.wikidata.org/wiki/Q850210","display_name":"Revenue","level":2,"score":0.5177571177482605},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.36035871505737305},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.32999324798583984},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.3294237554073334},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2512710690498352},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.20189496874809265},{"id":"https://openalex.org/C512338625","wikidata":"https://www.wikidata.org/wiki/Q624902","display_name":"Online advertising","level":3,"score":0.19580590724945068},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10712701082229614},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.09047698974609375},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07925572991371155},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.3037940","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3037940","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:653652da20b54c08b5e2abeebf4b7189","is_oa":true,"landing_page_url":"https://doaj.org/article/653652da20b54c08b5e2abeebf4b7189","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 213587-213601 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3037940","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3037940","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.4000000059604645,"display_name":"Partnerships for the goals"}],"awards":[{"id":"https://openalex.org/G4531568404","display_name":null,"funder_award_id":"61472064","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G685846593","display_name":null,"funder_award_id":"61202445","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1498502445","https://openalex.org/W1506085041","https://openalex.org/W1522301498","https://openalex.org/W1547105496","https://openalex.org/W1836465849","https://openalex.org/W1888895843","https://openalex.org/W1973081445","https://openalex.org/W1973976093","https://openalex.org/W2021375049","https://openalex.org/W2022091784","https://openalex.org/W2031745992","https://openalex.org/W2039842578","https://openalex.org/W2046376809","https://openalex.org/W2090883204","https://openalex.org/W2094286023","https://openalex.org/W2121863487","https://openalex.org/W2149822245","https://openalex.org/W2155027007","https://openalex.org/W2156387975","https://openalex.org/W2172968643","https://openalex.org/W2173248099","https://openalex.org/W2317606158","https://openalex.org/W2530299800","https://openalex.org/W2562337727","https://openalex.org/W2761686124","https://openalex.org/W2787938642","https://openalex.org/W2788376840","https://openalex.org/W2952072798","https://openalex.org/W2962684874","https://openalex.org/W2963841569","https://openalex.org/W2963864421","https://openalex.org/W2963923407","https://openalex.org/W2964121744","https://openalex.org/W2964325980","https://openalex.org/W3004257040","https://openalex.org/W3099947523","https://openalex.org/W3105140685","https://openalex.org/W4214717370","https://openalex.org/W6629793200","https://openalex.org/W6631190155","https://openalex.org/W6639248806","https://openalex.org/W6682889407","https://openalex.org/W6683204974","https://openalex.org/W6695986770","https://openalex.org/W6748839928"],"related_works":["https://openalex.org/W2372662578","https://openalex.org/W2367213784","https://openalex.org/W2355176056","https://openalex.org/W2360391211","https://openalex.org/W2141395620","https://openalex.org/W2360290312","https://openalex.org/W2380848687","https://openalex.org/W3099082736","https://openalex.org/W4385421505","https://openalex.org/W341704063"],"abstract_inverted_index":{"Real-time":[0],"bidding":[1,31,42,61,86,97,119,141,155,160,169,178,188,215,235],"(RTB)":[2],"is":[3,44,180],"one":[4],"of":[5,171,232],"the":[6,14,26,32,41,68,74,77,85,96,105,110,117,123,140,168,177,195,200,218,226,233],"most":[7,59],"striking":[8],"advances":[9],"in":[10,30],"online":[11],"advertising,":[12],"where":[13],"websites":[15],"can":[16,28,191],"sell":[17],"each":[18,158,184,211],"ad":[19,79,147],"impression":[20,33],"through":[21],"a":[22,222],"public":[23,223],"auction,":[24],"and":[25,56,76,94,167,229],"advertisers":[27,49],"participate":[29],"based":[34,100],"on":[35,101,133,163,221],"its":[36,164,172],"estimated":[37,165],"value.":[38],"In":[39,128],"RTB,":[40],"strategy":[43,120,179,236],"an":[45,146],"essential":[46],"component":[47],"for":[48,122],"to":[50,115,138,182,194,209],"maximize":[51],"their":[52],"revenues":[53],"(e.g.,":[54],"clicks":[55],"conversions).":[57],"However,":[58],"existing":[60],"strategies":[62],"may":[63],"not":[64],"work":[65],"well":[66],"when":[67],"RTB":[69,126,196],"environment":[70],"changes":[71],"dramatically":[72],"between":[73],"historical":[75,102],"new":[78],"delivery":[80,148],"periods":[81],"since":[82],"they":[83],"regard":[84],"decision":[87],"as":[88],"$\\boldsymbol":[89],"{a}$":[90],"static":[91],"optimization":[92],"problem":[93],"derive":[95],"function":[98],"only":[99],"data.":[103],"Thus,":[104],"latest":[106],"research":[107],"suggests":[108],"using":[109,134],"reinforcement":[111,136],"learning":[112,137],"(RL)":[113],"framework":[114],"learn":[116,210],"optimal":[118,187,214],"suitable":[121],"highly":[124],"dynamic":[125],"environment.":[127,197],"this":[129],"paper,":[130],"we":[131,144],"focus":[132],"model-free":[135],"optimize":[139],"strategy.":[142],"Specifically,":[143],"divide":[145],"period":[149],"into":[150],"several":[151],"time":[152,174,185,212],"slots.":[153],"The":[154],"agent":[156],"decides":[157],"impression's":[159],"price":[161],"depending":[162],"value":[166],"factor":[170],"arriving":[173],"slot.":[175],"Therefore,":[176],"simplified":[181],"solve":[183],"slot's":[186,213],"factor,":[189],"which":[190],"adapt":[192],"dynamically":[193],"We":[198],"exploit":[199],"Twin":[201],"Delayed":[202],"Deep":[203],"Deterministic":[204],"policy":[205],"gradient":[206],"(TD3)":[207],"algorithm":[208],"factor.":[216],"Finally,":[217],"empirical":[219],"study":[220],"dataset":[224],"demonstrates":[225],"superior":[227],"performance":[228],"high":[230],"efficiency":[231],"proposed":[234],"compared":[237],"with":[238],"other":[239],"state-of-the-art":[240],"baselines.":[241]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
