{"id":"https://openalex.org/W4220904111","doi":"https://doi.org/10.1016/j.neunet.2022.03.015","title":"Selective particle attention: Rapidly and flexibly selecting features for deep reinforcement learning","display_name":"Selective particle attention: Rapidly and flexibly selecting features for deep reinforcement learning","publication_year":2022,"publication_date":"2022-03-17","ids":{"openalex":"https://openalex.org/W4220904111","doi":"https://doi.org/10.1016/j.neunet.2022.03.015","pmid":"https://pubmed.ncbi.nlm.nih.gov/35358888"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.neunet.2022.03.015","pdf_url":null,"source":{"id":"https://openalex.org/S123019304","display_name":"Neural Networks","issn_l":"0893-6080","issn":["0893-6080","1879-2782"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.neunet.2022.03.015","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065665155","display_name":"Sam Blakeman","orcid":"https://orcid.org/0000-0002-5023-7933"},"institutions":[{"id":"https://openalex.org/I98259816","display_name":"Birkbeck, University of London","ror":"https://ror.org/02mb95055","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I98259816"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Sam Blakeman","raw_affiliation_strings":["Centre for Brain and Cognitive Development, Department of Psychological Sciences, Birkbeck, University of London, Malet Street, WC1E 7HX, United Kingdom","Sony AI, Wiesenstrasse 5, 8952, Schlieren, Switzerland"],"affiliations":[{"raw_affiliation_string":"Sony AI, Wiesenstrasse 5, 8952, Schlieren, Switzerland","institution_ids":[]},{"raw_affiliation_string":"Centre for Brain and Cognitive Development, Department of Psychological Sciences, Birkbeck, University of London, Malet Street, WC1E 7HX, United Kingdom","institution_ids":["https://openalex.org/I98259816"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073001689","display_name":"Denis Mareschal","orcid":"https://orcid.org/0000-0002-9828-9548"},"institutions":[{"id":"https://openalex.org/I98259816","display_name":"Birkbeck, University of London","ror":"https://ror.org/02mb95055","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I98259816"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Denis Mareschal","raw_affiliation_strings":["Centre for Brain and Cognitive Development, Department of Psychological Sciences, Birkbeck, University of London, Malet Street, WC1E 7HX, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Centre for Brain and Cognitive Development, Department of Psychological Sciences, Birkbeck, University of London, Malet Street, WC1E 7HX, United Kingdom","institution_ids":["https://openalex.org/I98259816"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5065665155"],"corresponding_institution_ids":["https://openalex.org/I98259816"],"apc_list":{"value":3350,"currency":"USD","value_usd":3350,"provenance":"doaj"},"apc_paid":{"value":3350,"currency":"USD","value_usd":3350,"provenance":"doaj"},"fwci":0.332,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":2,"citation_normalized_percentile":{"value":0.37728,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":70,"max":76},"biblio":{"volume":"150","issue":null,"first_page":"408","last_page":"421"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10581","display_name":"Neural dynamics and brain function","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10581","display_name":"Neural dynamics and brain function","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.993,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9873,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7723942},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.43325025}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7943286},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7936934},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7723942},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.74918973},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6772093},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.6579027},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5207503},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44876313},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.43325025},{"id":"https://openalex.org/C52421305","wikidata":"https://www.wikidata.org/wiki/Q1151499","display_name":"Particle filter","level":3,"score":0.42512992},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.34796152},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C157286648","wikidata":"https://www.wikidata.org/wiki/Q846780","display_name":"Kalman filter","level":2,"score":0.0}],"mesh":[{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001685","descriptor_name":"Biological Factors","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012201","descriptor_name":"Reward","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":4,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.neunet.2022.03.015","pdf_url":null,"source":{"id":"https://openalex.org/S123019304","display_name":"Neural Networks","issn_l":"0893-6080","issn":["0893-6080","1879-2782"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC9037388","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://eprints.bbk.ac.uk/id/eprint/47766/1/47766.pdf","pdf_url":"https://eprints.bbk.ac.uk/id/eprint/47766/1/47766.pdf","source":{"id":"https://openalex.org/S4306400466","display_name":"BIROn (Birkbeck, University of London)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98259816","host_organization_name":"Birkbeck, University of London","host_organization_lineage":["https://openalex.org/I98259816"],"host_organization_lineage_names":["Birkbeck, University of London"],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35358888","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.neunet.2022.03.015","pdf_url":null,"source":{"id":"https://openalex.org/S123019304","display_name":"Neural Networks","issn_l":"0893-6080","issn":["0893-6080","1879-2782"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Peace, justice, and strong institutions","score":0.81,"id":"https://metadata.un.org/sdg/16"}],"grants":[{"funder":"https://openalex.org/F4320334629","funder_display_name":"Biotechnology and Biological Sciences Research Council","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":59,"referenced_works":["https://openalex.org/W1581202840","https://openalex.org/W1602651658","https://openalex.org/W1675937554","https://openalex.org/W1686810756","https://openalex.org/W1969757816","https://openalex.org/W1973479817","https://openalex.org/W1986264597","https://openalex.org/W1989692592","https://openalex.org/W1992694071","https://openalex.org/W1993637338","https://openalex.org/W2007339694","https://openalex.org/W2027096892","https://openalex.org/W2037986568","https://openalex.org/W2041336675","https://openalex.org/W2064675550","https://openalex.org/W2078492619","https://openalex.org/W2088085131","https://openalex.org/W2115733720","https://openalex.org/W2118615399","https://openalex.org/W2120545133","https://openalex.org/W2145339207","https://openalex.org/W2149166988","https://openalex.org/W2151137320","https://openalex.org/W2169214866","https://openalex.org/W2183992914","https://openalex.org/W2266673418","https://openalex.org/W2753738274","https://openalex.org/W2759324644","https://openalex.org/W2769514070","https://openalex.org/W2774756601","https://openalex.org/W2807340089","https://openalex.org/W2807915115","https://openalex.org/W2823112946","https://openalex.org/W2892147425","https://openalex.org/W2893184150","https://openalex.org/W2899742573","https://openalex.org/W2902476877","https://openalex.org/W2917491140","https://openalex.org/W2927638312","https://openalex.org/W2950872548","https://openalex.org/W2963305465","https://openalex.org/W2977481643","https://openalex.org/W2982316857","https://openalex.org/W2995546843","https://openalex.org/W2999905431","https://openalex.org/W3017152929","https://openalex.org/W3115293622","https://openalex.org/W3118608800","https://openalex.org/W3150815575","https://openalex.org/W3170308824","https://openalex.org/W3206188474","https://openalex.org/W4214717370","https://openalex.org/W4233065987","https://openalex.org/W4234009070","https://openalex.org/W4248221301","https://openalex.org/W4249142012","https://openalex.org/W4297744728","https://openalex.org/W4301172471","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W4378510483","https://openalex.org/W4376166922","https://openalex.org/W4362597605","https://openalex.org/W4297676672","https://openalex.org/W4281702477","https://openalex.org/W3099765033","https://openalex.org/W3009056573","https://openalex.org/W2922073769","https://openalex.org/W2490526372","https://openalex.org/W1574414179"],"abstract_inverted_index":{"Deep":[0,27,48,71,158,224],"Reinforcement":[1],"Learning":[2],"(RL)":[3],"is":[4,25,45,82,169],"often":[5],"criticised":[6],"for":[7,22,41,116,157],"being":[8],"data":[9,87],"inefficient":[10],"and":[11,81,89,108,141,171,183,205,212,220],"inflexible":[12],"to":[13,46,50,86,97,128,173,208],"changes":[14,207],"in":[15,36,57,138],"task":[16,121,210],"structure.":[17],"Part":[18],"of":[19,77,92,113,154,188,222],"the":[20,67,70,120,209,218],"reason":[21],"these":[23,43,114,161],"issues":[24],"that":[26,53,181,200,214],"RL":[28,49,72,225],"typically":[29],"learns":[30,74],"end-to-end":[31],"using":[32,190],"backpropagation,":[33,167],"which":[34,151,168],"results":[35],"task-specific":[37],"representations.":[38],"One":[39],"approach":[40],"circumventing":[42],"problems":[44],"apply":[47],"existing":[51,155],"representations":[52,80,104,156],"have":[54],"been":[55],"learned":[56,165],"a":[58,75,90,111,124,143,178],"more":[59],"task-agnostic":[60],"fashion.":[61],"However,":[62],"this":[63,99],"only":[64,109,191],"partially":[65],"solves":[66],"problem":[68,100],"as":[69,129],"algorithm":[73,145],"function":[76],"all":[78],"pre-existing":[79],"therefore":[83],"still":[84],"susceptible":[85],"inefficiency":[88],"lack":[91],"flexibility.":[93],"Biological":[94],"agents":[95,140],"appear":[96],"solve":[98],"by":[101],"forming":[102],"internal":[103],"over":[105],"many":[106],"tasks":[107,199],"selecting":[110],"subset":[112],"features":[115,189],"decision-making":[117],"based":[118],"on":[119,197],"at":[122],"hand;":[123],"process":[125],"commonly":[126],"referred":[127],"selective":[130,136],"attention.":[131],"We":[132,194],"take":[133],"inspiration":[134],"from":[135],"attention":[137],"biological":[139],"propose":[142],"novel":[144],"called":[146],"Selective":[147],"Particle":[148],"Attention":[149],"(SPA),":[150],"selects":[152],"subsets":[153,162,187],"RL.":[159],"Crucially,":[160],"are":[163],"not":[164],"through":[166],"slow":[170],"prone":[172],"overfitting,":[174],"but":[175],"instead":[176],"via":[177],"particle":[179],"filter":[180],"rapidly":[182],"flexibly":[184],"identifies":[185],"key":[186],"reward":[192],"feedback.":[193],"evaluate":[195],"SPA":[196],"two":[198],"involve":[201],"raw":[202],"pixel":[203],"input":[204],"dynamic":[206],"structure,":[211],"show":[213],"it":[215],"greatly":[216],"increases":[217],"efficiency":[219],"flexibility":[221],"downstream":[223],"algorithms.":[226]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4220904111","counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2024-12-19T01:52:59.889899","created_date":"2022-04-03"}