{"id":"https://openalex.org/W4224992903","doi":"https://doi.org/10.48550/arxiv.2204.11842","title":"Adaptive Online Value Function Approximation with Wavelets","display_name":"Adaptive Online Value Function Approximation with Wavelets","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4224992903","doi":"https://doi.org/10.48550/arxiv.2204.11842"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2204.11842","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2204.11842","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091348511","display_name":"Michael Beukman","orcid":"https://orcid.org/0000-0002-5468-284X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Beukman, Michael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016013995","display_name":"Michael Mitchley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mitchley, Michael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068919660","display_name":"Dean Wookey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wookey, Dean","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078861770","display_name":"Steven James","orcid":"https://orcid.org/0000-0003-4366-4125"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"James, Steven","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5078124517","display_name":"George Konidaris","orcid":"https://orcid.org/0000-0002-4460-2519"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Konidaris, George","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":60},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9927,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9927,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10270","display_name":"Blockchain Technology Applications and Security","score":0.944,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9367,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/basis-function","display_name":"Basis function","score":0.7079009},{"id":"https://openalex.org/keywords/basis","display_name":"Basis (linear algebra)","score":0.670277},{"id":"https://openalex.org/keywords/function-approximation","display_name":"Function Approximation","score":0.5742353},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.41857645}],"concepts":[{"id":"https://openalex.org/C47432892","wikidata":"https://www.wikidata.org/wiki/Q831390","display_name":"Wavelet","level":2,"score":0.8089594},{"id":"https://openalex.org/C5917680","wikidata":"https://www.wikidata.org/wiki/Q2621825","display_name":"Basis function","level":2,"score":0.7079009},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.670277},{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.5742353},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.54767954},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.5109026},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4836196},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.44207942},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.43619984},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4242545},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.41857645},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.40226737},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.35743764},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32423228},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.08633259},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2204.11842","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.11842","pdf_url":"http://arxiv.org/pdf/2204.11842","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2204.11842","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2204.11842","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4322615556","https://openalex.org/W4287555349","https://openalex.org/W3198417070","https://openalex.org/W3133651710","https://openalex.org/W3113111988","https://openalex.org/W2999756192","https://openalex.org/W2963359646","https://openalex.org/W2931688134","https://openalex.org/W2378857091","https://openalex.org/W2377919138"],"abstract_inverted_index":{"Using":[0],"function":[1,7,17,139],"approximation":[2,18,108],"to":[3,79,91,136,180],"represent":[4],"a":[5,71,94,110,138,154,177],"value":[6],"is":[8],"necessary":[9,130],"for":[10,62],"continuous":[11],"and":[12,23,28,74,131,169,171],"high-dimensional":[13],"state":[14,51,113],"spaces.":[15],"Linear":[16],"has":[19],"desirable":[20],"theoretical":[21],"guarantees":[22],"often":[24],"requires":[25],"less":[26],"compute":[27],"samples":[29],"than":[30],"neural":[31],"networks,":[32],"but":[33],"most":[34],"approaches":[35],"suffer":[36],"from":[37],"an":[38,182],"exponential":[39],"growth":[40],"in":[41,112,117],"the":[42,47,50,59,77,82,104,107,162,173,195],"number":[43],"of":[44,49,106,148],"functions":[45],"as":[46,70,85,122],"dimensionality":[48],"space":[52],"increases.":[53],"In":[54],"this":[55],"work,":[56],"we":[57,134],"introduce":[58],"wavelet":[60,156,197],"basis":[61,73,83,96,157,165,185],"reinforcement":[63],"learning.":[64],"Wavelets":[65],"can":[66,101,142],"effectively":[67],"be":[68,143],"used":[69],"fixed":[72,155,196],"additionally":[75],"provide":[76,176],"ability":[78],"adaptively":[80,144],"refine":[81],"set":[84,158],"learning":[86],"progresses,":[87],"making":[88],"it":[89],"feasible":[90],"start":[92],"with":[93],"minimal":[95],"set.":[97],"This":[98],"adaptive":[99,174],"method":[100],"either":[102],"increase":[103],"granularity":[105],"at":[109],"point":[111],"space,":[114],"or":[115,192],"add":[116],"interactions":[118],"between":[119],"different":[120],"dimensions":[121],"necessary.":[123],"We":[124,150],"prove":[125],"that":[126,141,153,172],"wavelets":[127],"are":[128],"both":[129],"sufficient":[132],"if":[133],"wish":[135],"construct":[137],"approximator":[140],"refined":[145],"without":[146],"loss":[147],"precision.":[149],"further":[151],"demonstrate":[152],"performs":[159],"comparably":[160],"against":[161],"high-performing":[163],"Fourier":[164],"on":[166],"Mountain":[167],"Car":[168],"Acrobot,":[170],"methods":[175],"convenient":[178],"approach":[179],"addressing":[181],"oversized":[183],"initial":[184],"set,":[186],"while":[187],"demonstrating":[188],"performance":[189],"comparable":[190],"to,":[191],"greater":[193],"than,":[194],"basis.":[198]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4224992903","counts_by_year":[],"updated_date":"2024-12-15T16:41:10.170581","created_date":"2022-04-28"}