{"id":"https://openalex.org/W2990183840","doi":"https://doi.org/10.1109/cbd.2019.00051","title":"An Intelligent Bidding Strategy Based on Model-Free Reinforcement Learning for Real-Time Bidding in Display Advertising","display_name":"An Intelligent Bidding Strategy Based on Model-Free Reinforcement Learning for Real-Time Bidding in Display Advertising","publication_year":2019,"publication_date":"2019-09-01","ids":{"openalex":"https://openalex.org/W2990183840","doi":"https://doi.org/10.1109/cbd.2019.00051","mag":"2990183840"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbd.2019.00051","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005041726","display_name":"Mengjuan Liu","orcid":"https://orcid.org/0000-0003-3679-7915"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"funder","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengjuan Liu","raw_affiliation_strings":["School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100636528","display_name":"Jiaxing Li","orcid":"https://orcid.org/0000-0001-7048-9284"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"funder","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaxing Li","raw_affiliation_strings":["School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084398278","display_name":"Wei Thoo Yue","orcid":"https://orcid.org/0000-0002-1344-153X"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"funder","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Yue","raw_affiliation_strings":["School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005796407","display_name":"Lizhou Qiu","orcid":"https://orcid.org/0000-0003-4293-6969"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"funder","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lizhou Qiu","raw_affiliation_strings":["School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100329170","display_name":"Jinyu Liu","orcid":"https://orcid.org/0000-0001-5428-625X"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"funder","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinyu Liu","raw_affiliation_strings":["School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045032131","display_name":"Zhiguang Qin","orcid":"https://orcid.org/0000-0001-6745-6377"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"funder","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiguang Qin","raw_affiliation_strings":["School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Software Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.513,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.630278,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":69,"max":74},"biblio":{"volume":null,"issue":null,"first_page":"240","last_page":"245"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.9953,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.9953,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9907,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9623,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/real-time-bidding","display_name":"Real-time bidding","score":0.8612883},{"id":"https://openalex.org/keywords/display-advertising","display_name":"Display advertising","score":0.7136357},{"id":"https://openalex.org/keywords/ebidding","display_name":"Ebidding","score":0.56689304}],"concepts":[{"id":"https://openalex.org/C9233905","wikidata":"https://www.wikidata.org/wiki/Q3276328","display_name":"Bidding","level":2,"score":0.9341778},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8642005},{"id":"https://openalex.org/C1525070","wikidata":"https://www.wikidata.org/wiki/Q2134714","display_name":"Real-time bidding","level":3,"score":0.8612883},{"id":"https://openalex.org/C2777999536","wikidata":"https://www.wikidata.org/wiki/Q2399498","display_name":"Display advertising","level":4,"score":0.7136357},{"id":"https://openalex.org/C163239763","wikidata":"https://www.wikidata.org/wiki/Q5153637","display_name":"Common value auction","level":2,"score":0.70710653},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6956699},{"id":"https://openalex.org/C195487862","wikidata":"https://www.wikidata.org/wiki/Q850210","display_name":"Revenue","level":2,"score":0.6092111},{"id":"https://openalex.org/C143989560","wikidata":"https://www.wikidata.org/wiki/Q17011617","display_name":"Ebidding","level":3,"score":0.56689304},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.412205},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.41052386},{"id":"https://openalex.org/C512338625","wikidata":"https://www.wikidata.org/wiki/Q624902","display_name":"Online advertising","level":3,"score":0.40905434},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3591499},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3300991},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.2438316},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.14353707},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.14294413},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12927091},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbd.2019.00051","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.48,"id":"https://metadata.un.org/sdg/17"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":23,"referenced_works":["https://openalex.org/W1516061453","https://openalex.org/W1547105496","https://openalex.org/W1557517019","https://openalex.org/W1757796397","https://openalex.org/W1973976093","https://openalex.org/W2021375049","https://openalex.org/W2022091784","https://openalex.org/W2039842578","https://openalex.org/W2121863487","https://openalex.org/W2149822245","https://openalex.org/W2155027007","https://openalex.org/W2211399443","https://openalex.org/W2530299800","https://openalex.org/W2562337727","https://openalex.org/W2951002685","https://openalex.org/W2962684874","https://openalex.org/W2963864421","https://openalex.org/W3099947523","https://openalex.org/W3105140685","https://openalex.org/W3139377883","https://openalex.org/W32403112","https://openalex.org/W4214717370","https://openalex.org/W4298857966"],"related_works":["https://openalex.org/W4306254152","https://openalex.org/W4301661005","https://openalex.org/W3099082736","https://openalex.org/W2990183840","https://openalex.org/W2952820798","https://openalex.org/W2951754014","https://openalex.org/W2770888277","https://openalex.org/W2317606158","https://openalex.org/W2115496895","https://openalex.org/W2039842578"],"abstract_inverted_index":{"In":[0,84],"recent":[1,58],"years,":[2],"the":[3,31,41,47,51,57,63,70,79,99,105,110,119,124,132,137,143,162,170,175,178,188,193],"most":[4],"important":[5],"paradigm":[6],"in":[7,74,167],"online":[8],"display":[9],"advertising":[10],"is":[11,102,116],"real-time":[12,24],"bidding":[13,72,91,120,139,164,180],"(RTB).":[14],"It":[15],"allows":[16],"advertisers":[17],"to":[18,26,68,117,154,161,200],"buy":[19],"individual":[20],"ad":[21,37,53],"impressions":[22],"through":[23],"auctions,":[25],"obtain":[27],"maximum":[28],"revenue.":[29],"However,":[30],"existing":[32],"strategies":[33],"usually":[34],"bid":[35,45],"an":[36,114],"impression":[38],"independently,":[39],"ignoring":[40],"impacts":[42],"of":[43,177],"each":[44],"on":[46,77,183],"overall":[48],"revenue":[49],"during":[50],"whole":[52],"delivery":[54],"period.":[55],"Thus,":[56],"research":[59],"suggests":[60],"that":[61],"using":[62],"reinforcement":[64,95],"learning":[65,96],"(RL)":[66],"framework":[67],"learn":[69,136],"optimal":[71,138],"strategy":[73,140,165,181],"RTB,":[75],"based":[76,182],"both":[78],"immediate":[80],"and":[81,109,158,187,196],"future":[82],"rewards.":[83],"this":[85],"paper,":[86],"we":[87,135,148],"formulate":[88],"budget":[89],"constrained":[90],"as":[92],"a":[93,184],"model-free":[94,127],"problem,":[97,134],"where":[98],"state":[100],"space":[101],"presented":[103],"by":[104,141],"impressions'":[106],"feature":[107],"parameters":[108],"auction":[111,156],"information,":[112],"while":[113],"action":[115],"set":[118],"price.":[121],"Different":[122],"from":[123,131],"prior":[125],"value-based":[126],"work,":[128],"which":[129],"suffers":[130],"convergence":[133],"employing":[142],"policy":[144],"gradient":[145],"model.":[146],"Additionally,":[147],"design":[149],"four":[150],"reward":[151],"functions":[152],"according":[153],"different":[155],"results":[157,190],"user":[159],"feedback":[160],"learned":[163],"more":[166],"line":[168],"with":[169],"optimization":[171],"objectives.":[172],"We":[173],"evaluate":[174],"performance":[176,195],"proposed":[179],"real-world":[185],"dataset,":[186],"experimental":[189],"have":[191],"demonstrated":[192],"superior":[194],"high":[197],"efficiency":[198],"compared":[199],"state-of-the-art":[201],"methods.":[202]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2990183840","counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-02-18T04:27:20.135546","created_date":"2019-12-05"}