{"id":"https://openalex.org/W3114285181","doi":"https://doi.org/10.1145/3430984.3431045","title":"A Multi-Agent Reinforcement Learning Approach for Stock Portfolio Allocation","display_name":"A Multi-Agent Reinforcement Learning Approach for Stock Portfolio Allocation","publication_year":2020,"publication_date":"2020-12-28","ids":{"openalex":"https://openalex.org/W3114285181","doi":"https://doi.org/10.1145/3430984.3431045","mag":"3114285181"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3430984.3431045","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008023780","display_name":"Prahlad Koratamaddi","orcid":null},"institutions":[{"id":"https://openalex.org/I121750182","display_name":"National Institute of Technology Warangal","ror":"https://ror.org/017ebfz38","country_code":"IN","type":"education","lineage":["https://openalex.org/I121750182"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Prahlad Koratamaddi","raw_affiliation_strings":["National Institute of Technology Warangal"],"affiliations":[{"raw_affiliation_string":"National Institute of Technology Warangal","institution_ids":["https://openalex.org/I121750182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082056973","display_name":"Karan Wadhwani","orcid":null},"institutions":[{"id":"https://openalex.org/I121750182","display_name":"National Institute of Technology Warangal","ror":"https://ror.org/017ebfz38","country_code":"IN","type":"education","lineage":["https://openalex.org/I121750182"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Karan Wadhwani","raw_affiliation_strings":["National Institute of Technology Warangal"],"affiliations":[{"raw_affiliation_string":"National Institute of Technology Warangal","institution_ids":["https://openalex.org/I121750182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020169677","display_name":"Mridul Gupta","orcid":"https://orcid.org/0000-0001-6181-1403"},"institutions":[{"id":"https://openalex.org/I121750182","display_name":"National Institute of Technology Warangal","ror":"https://ror.org/017ebfz38","country_code":"IN","type":"education","lineage":["https://openalex.org/I121750182"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Mridul Gupta","raw_affiliation_strings":["National Institute of Technology Warangal"],"affiliations":[{"raw_affiliation_string":"National Institute of Technology Warangal","institution_ids":["https://openalex.org/I121750182"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034835113","display_name":"Sriram G. Sanjeevi","orcid":null},"institutions":[{"id":"https://openalex.org/I121750182","display_name":"National Institute of Technology Warangal","ror":"https://ror.org/017ebfz38","country_code":"IN","type":"education","lineage":["https://openalex.org/I121750182"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Dr. Sriram G. Sanjeevi","raw_affiliation_strings":["National Institute of Technology Warangal"],"affiliations":[{"raw_affiliation_string":"National Institute of Technology Warangal","institution_ids":["https://openalex.org/I121750182"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.219,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.522048,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":60,"max":69},"biblio":{"volume":null,"issue":null,"first_page":"410","last_page":"410"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10047","display_name":"Financial Markets and Investment Strategies","score":0.9934,"subfield":{"id":"https://openalex.org/subfields/2003","display_name":"Finance"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10047","display_name":"Financial Markets and Investment Strategies","score":0.9934,"subfield":{"id":"https://openalex.org/subfields/2003","display_name":"Finance"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9816,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11270","display_name":"Complex Systems and Time Series Analysis","score":0.9625,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stock","display_name":"Stock (firearms)","score":0.49217883},{"id":"https://openalex.org/keywords/portfolio-allocation","display_name":"Portfolio allocation","score":0.45620748}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9297577},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.70911825},{"id":"https://openalex.org/C2780821815","wikidata":"https://www.wikidata.org/wiki/Q5340806","display_name":"Portfolio","level":2,"score":0.666699},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.58778596},{"id":"https://openalex.org/C204036174","wikidata":"https://www.wikidata.org/wiki/Q909380","display_name":"Stock (firearms)","level":2,"score":0.49217883},{"id":"https://openalex.org/C2780299701","wikidata":"https://www.wikidata.org/wiki/Q475000","display_name":"Stock market","level":3,"score":0.4875023},{"id":"https://openalex.org/C2993800227","wikidata":"https://www.wikidata.org/wiki/Q7231728","display_name":"Portfolio allocation","level":3,"score":0.45620748},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38876125},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.32187492},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.14266351},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.13315642},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09425166},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C2780762169","wikidata":"https://www.wikidata.org/wiki/Q5905368","display_name":"Horse","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3430984.3431045","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals","score":0.51}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":5,"referenced_works":["https://openalex.org/W2047267926","https://openalex.org/W2153580489","https://openalex.org/W2173248099","https://openalex.org/W2901174038","https://openalex.org/W2954535276"],"related_works":["https://openalex.org/W4383874400","https://openalex.org/W4380318855","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W3136925080","https://openalex.org/W2586732548","https://openalex.org/W2370669686","https://openalex.org/W2158350033","https://openalex.org/W2138720691","https://openalex.org/W2031695474"],"abstract_inverted_index":{"Stock":[0],"portfolio":[1,26],"allocation":[2],"is":[3,100],"one":[4],"of":[5,12,49,63,107,114],"the":[6,42,47,61,90,105,112],"most":[7,29],"challenging":[8],"and":[9,76],"interesting":[10],"problems":[11],"modern":[13],"finance.":[14],"Recently,":[15],"deep":[16,65,78],"reinforcement":[17,66],"learning":[18,36,67,109],"applications":[19],"have":[20],"shown":[21],"promising":[22],"results":[23,91],"in":[24,52,84,104],"automating":[25],"allocation.":[27],"However,":[28],"current":[30],"approaches":[31],"use":[32],"a":[33,85,101],"single":[34],"agent":[35],"model":[37],"which":[38],"could":[39],"inadequately":[40],"capture":[41],"complex":[43],"dynamics":[44],"arising":[45],"from":[46],"interactions":[48],"many":[50],"traders":[51],"today's":[53],"stock":[54],"market.":[55],"In":[56],"this":[57,69],"paper,":[58],"we":[59,96],"explore":[60],"applicability":[62],"multi-agent":[64],"to":[68],"problem":[70],"by":[71],"implementing":[72],"single-agent,":[73],"2-agent,":[74],"3-agent,":[75],"4-agent":[77],"deterministic":[79],"policy":[80],"gradients":[81],"(DDPG)":[82],"algorithms":[83],"competitive":[86],"setting.":[87],"Upon":[88],"analyzing":[89],"obtained":[92],"using":[93],"standardized":[94],"metrics,":[95],"observe":[97],"that":[98],"there":[99],"significant":[102],"improvement":[103],"performance":[106],"our":[108],"models":[110],"with":[111],"introduction":[113],"multiple":[115],"agents.":[116]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3114285181","counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2025-01-05T18:45:05.059638","created_date":"2021-01-05"}