{"id":"https://openalex.org/W4294771618","doi":"https://doi.org/10.3233/aic-220113","title":"Developing, evaluating and scaling learning agents in multi-agent environments","display_name":"Developing, evaluating and scaling learning agents in multi-agent environments","publication_year":2022,"publication_date":"2022-09-06","ids":{"openalex":"https://openalex.org/W4294771618","doi":"https://doi.org/10.3233/aic-220113"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.3233/aic-220113","pdf_url":null,"source":{"id":"https://openalex.org/S176303223","display_name":"AI Communications","issn_l":"0921-7126","issn":["0921-7126","1875-8452"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2209.10958","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112947561","display_name":"Ian Gemp","orcid":"https://orcid.org/0000-0002-7774-3246"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ian Gemp","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000081835","display_name":"Thomas Anthony","orcid":"https://orcid.org/0000-0002-4443-5466"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Thomas Anthony","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062949033","display_name":"Yoram Bachrach","orcid":"https://orcid.org/0000-0002-4382-7636"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yoram Bachrach","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029311828","display_name":"Avishkar Bhoopchand","orcid":"https://orcid.org/0009-0004-0465-4244"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Avishkar Bhoopchand","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061034972","display_name":"Kalesha Bullard","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kalesha Bullard","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041881668","display_name":"Jerome T. Connor","orcid":"https://orcid.org/0000-0002-7141-6260"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jerome Connor","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012909623","display_name":"Vibhavari Dasagi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Vibhavari Dasagi","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027641103","display_name":"Bart De Vylder","orcid":"https://orcid.org/0000-0002-7833-4831"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Bart De Vylder","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061221525","display_name":"Edgar A. Du\u00e9\u00f1ez\u2010Guzm\u00e1n","orcid":"https://orcid.org/0000-0002-6212-9104"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Edgar\u00a0A. Du\u00e9\u00f1ez-Guzm\u00e1n","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085971810","display_name":"Romuald \u00c9lie","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Romuald Elie","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007090604","display_name":"Richard Everett","orcid":"https://orcid.org/0000-0002-9404-6338"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Richard Everett","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043984392","display_name":"Daniel Hennes","orcid":"https://orcid.org/0000-0002-3646-5286"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Daniel Hennes","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006947993","display_name":"Edward Hughes","orcid":"https://orcid.org/0000-0002-2434-2334"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Edward Hughes","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061261923","display_name":"Mina Khan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Mina Khan","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049659586","display_name":"Marc Lanctot","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Marc Lanctot","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105978897","display_name":"Kate Larson","orcid":"https://orcid.org/0000-0002-5455-9657"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kate Larson","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031943811","display_name":"Guy Lever","orcid":"https://orcid.org/0000-0001-9551-1839"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Guy Lever","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100390236","display_name":"Siqi Liu","orcid":"https://orcid.org/0000-0002-4675-5498"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Siqi Liu","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051039278","display_name":"Luke Marris","orcid":null},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Luke Marris","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013841168","display_name":"Kevin R. McKee","orcid":"https://orcid.org/0000-0002-4412-1686"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kevin R. McKee","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058922471","display_name":"Paul M\u00fcller","orcid":"https://orcid.org/0000-0002-5734-3130"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Paul Muller","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056707583","display_name":"Julien P\u00e9rolat","orcid":"https://orcid.org/0000-0002-8176-1666"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Julien P\u00e9rolat","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024394972","display_name":"Florian Strub","orcid":"https://orcid.org/0000-0001-7271-5345"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Florian Strub","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071433151","display_name":"Andrea Tacchetti","orcid":"https://orcid.org/0000-0001-9311-9171"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andrea Tacchetti","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072903215","display_name":"Eugene Tarassov","orcid":"https://orcid.org/0000-0002-7330-860X"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Eugene Tarassov","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100621319","display_name":"Zhe Wang","orcid":"https://orcid.org/0000-0002-3759-2041"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhe Wang","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008547992","display_name":"Karl Tuyls","orcid":"https://orcid.org/0000-0001-7929-1944"},"institutions":[{"id":"https://openalex.org/I4210090411","display_name":"DeepMind (United Kingdom)","ror":"https://ror.org/00971b260","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210090411","https://openalex.org/I4210128969"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Karl Tuyls","raw_affiliation_strings":["Game Theory & Multi-Agent Team, DeepMind, London, UK"],"affiliations":[{"raw_affiliation_string":"Game Theory & Multi-Agent Team, DeepMind, London, UK","institution_ids":["https://openalex.org/I4210090411"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5008547992"],"corresponding_institution_ids":["https://openalex.org/I4210090411"],"apc_list":null,"apc_paid":null,"fwci":0.162,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.418212,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":60,"max":70},"biblio":{"volume":"35","issue":"4","first_page":"271","last_page":"284"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.9882,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9784,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.83318627},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6650467},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.49599656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44564027},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.41507876},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.41451368},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.36577475},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.32905012},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.3233/aic-220113","pdf_url":null,"source":{"id":"https://openalex.org/S176303223","display_name":"AI Communications","issn_l":"0921-7126","issn":["0921-7126","1875-8452"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2209.10958","pdf_url":"https://arxiv.org/pdf/2209.10958","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2209.10958","pdf_url":"https://arxiv.org/pdf/2209.10958","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":32,"referenced_works":["https://openalex.org/W1192553058","https://openalex.org/W1605936240","https://openalex.org/W1963754118","https://openalex.org/W1995622844","https://openalex.org/W2000941866","https://openalex.org/W2011000015","https://openalex.org/W2038686546","https://openalex.org/W2108598243","https://openalex.org/W2586680856","https://openalex.org/W2766447205","https://openalex.org/W2896274930","https://openalex.org/W2916924555","https://openalex.org/W2925418831","https://openalex.org/W2963373847","https://openalex.org/W2964381205","https://openalex.org/W2982316857","https://openalex.org/W2997345668","https://openalex.org/W3034222845","https://openalex.org/W3092876226","https://openalex.org/W3102534762","https://openalex.org/W3121382465","https://openalex.org/W3126647909","https://openalex.org/W3128901210","https://openalex.org/W3158023256","https://openalex.org/W3163016373","https://openalex.org/W3167043448","https://openalex.org/W3190930624","https://openalex.org/W4206483639","https://openalex.org/W4207074987","https://openalex.org/W4225654671","https://openalex.org/W4287760655","https://openalex.org/W4287813665"],"related_works":["https://openalex.org/W4380318855","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W3049728571","https://openalex.org/W2964765435","https://openalex.org/W2586732548","https://openalex.org/W2138720691","https://openalex.org/W20361778","https://openalex.org/W2031695474","https://openalex.org/W2024136090"],"abstract_inverted_index":{"The":[0],"Game":[1],"Theory":[2],"&":[3],"Multi-Agent":[4],"team":[5,38,87],"at":[6,58],"DeepMind":[7,59],"studies":[8],"several":[9],"aspects":[10],"of":[11,44,85],"multi-agent":[12,66,101],"learning":[13,63],"ranging":[14],"from":[15],"computing":[16],"approximations":[17],"to":[18,24,48,56,64,75],"fundamental":[19],"concepts":[20],"in":[21,28,36,60,68,100],"game":[22],"theory":[23],"simulating":[25],"social":[26],"dilemmas":[27],"rich":[29],"spatial":[30],"environments":[31,70],"and":[32,52,71,88],"training":[33],"3-d":[34],"humanoids":[35],"difficult":[37],"coordination":[39],"tasks.":[40],"A":[41],"signature":[42],"aim":[43],"our":[45,77,86],"group":[46],"is":[47],"use":[49,72],"the":[50,82],"resources":[51],"expertise":[53],"made":[54],"available":[55],"us":[57],"deep":[61],"reinforcement":[62],"explore":[65],"systems":[67],"complex":[69],"these":[73],"benchmarks":[74],"advance":[76],"understanding.":[78],"Here,":[79],"we":[80,93],"summarise":[81],"recent":[83],"work":[84],"present":[89],"a":[90],"taxonomy":[91],"that":[92],"feel":[94],"highlights":[95],"many":[96],"important":[97],"open":[98],"challenges":[99],"research.":[102]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4294771618","counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2025-01-08T22:19:37.705629","created_date":"2022-09-06"}