{"id":"https://openalex.org/W1654131902","doi":"https://doi.org/10.1109/iros.1997.655073","title":"Region-based Q-learning using convex clustering approach","display_name":"Region-based Q-learning using convex clustering approach","publication_year":2002,"publication_date":"2002-11-22","ids":{"openalex":"https://openalex.org/W1654131902","doi":"https://doi.org/10.1109/iros.1997.655073","mag":"1654131902"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.1997.655073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006610241","display_name":"J.H. Kim","orcid":"https://orcid.org/0000-0003-2530-349X"},"institutions":[{"id":"https://openalex.org/I4575257","display_name":"Hanyang University","ror":"https://ror.org/046865y68","country_code":"KR","type":"funder","lineage":["https://openalex.org/I4575257"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"J.H. Kim","raw_affiliation_strings":["Intelligent Control & Robotics Lab., Hanyang Univ., Kyeongki, South Korea"],"affiliations":[{"raw_affiliation_string":"Intelligent Control & Robotics Lab., Hanyang Univ., Kyeongki, South Korea","institution_ids":["https://openalex.org/I4575257"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030410269","display_name":"Il Hong Suh","orcid":"https://orcid.org/0000-0002-0981-329X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"I.H. Suh","raw_affiliation_strings":["DEPARTMENT OF ELECTRONIC ENGINEERING"],"affiliations":[{"raw_affiliation_string":"DEPARTMENT OF ELECTRONIC ENGINEERING","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014100305","display_name":"Sang\u2013Rok Oh","orcid":"https://orcid.org/0000-0002-1102-031X"},"institutions":[{"id":"https://openalex.org/I4575257","display_name":"Hanyang University","ror":"https://ror.org/046865y68","country_code":"KR","type":"funder","lineage":["https://openalex.org/I4575257"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"S.R. Oh","raw_affiliation_strings":[" Hanyang University"],"affiliations":[{"raw_affiliation_string":" Hanyang University","institution_ids":["https://openalex.org/I4575257"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008385535","display_name":"Yunseol Cho","orcid":null},"institutions":[{"id":"https://openalex.org/I4575257","display_name":"Hanyang University","ror":"https://ror.org/046865y68","country_code":"KR","type":"funder","lineage":["https://openalex.org/I4575257"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Y.J. Cho","raw_affiliation_strings":[" Hanyang University"],"affiliations":[{"raw_affiliation_string":" Hanyang University","institution_ids":["https://openalex.org/I4575257"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108369781","display_name":"Y.K. Chung","orcid":null},"institutions":[{"id":"https://openalex.org/I4575257","display_name":"Hanyang University","ror":"https://ror.org/046865y68","country_code":"KR","type":"funder","lineage":["https://openalex.org/I4575257"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Y.K. Chung","raw_affiliation_strings":[" Hanyang University"],"affiliations":[{"raw_affiliation_string":" Hanyang University","institution_ids":["https://openalex.org/I4575257"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.54,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":6,"citation_normalized_percentile":{"value":0.523928,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":75,"max":76},"biblio":{"volume":"2","issue":null,"first_page":"601","last_page":"607"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9971,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9963,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.54317826},{"id":"https://openalex.org/keywords/scara","display_name":"SCARA","score":0.5099803}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6664003},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.59641635},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5573993},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.54317826},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5325982},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.51357293},{"id":"https://openalex.org/C158732272","wikidata":"https://www.wikidata.org/wiki/Q1484792","display_name":"SCARA","level":3,"score":0.5099803},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.48347074},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.46702743},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.43008986},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3284405},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27146834},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.18299645},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.1997.655073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":12,"referenced_works":["https://openalex.org/W1557517019","https://openalex.org/W1590631717","https://openalex.org/W1612579644","https://openalex.org/W1712925070","https://openalex.org/W1952590090","https://openalex.org/W2103626435","https://openalex.org/W2139465937","https://openalex.org/W2151012394","https://openalex.org/W2158316397","https://openalex.org/W3011120880","https://openalex.org/W32403112","https://openalex.org/W50296447"],"related_works":["https://openalex.org/W3169911176","https://openalex.org/W3095489175","https://openalex.org/W2573045761","https://openalex.org/W2542992786","https://openalex.org/W2171128163","https://openalex.org/W2113822937","https://openalex.org/W2104958792","https://openalex.org/W1968617831","https://openalex.org/W152605265","https://openalex.org/W1486209696"],"abstract_inverted_index":{"For":[0],"continuous":[1],"state":[2,56],"space":[3,109],"applications,":[4],"a":[5,16,24,30,36,49,83,104,118],"novel":[6],"method":[7,14,46,76,96,102],"of":[8,52,72,90],"Q-learning":[9,95,101],"is":[10,97],"proposed,":[11],"where":[12],"the":[13,39,63,88,93],"incorporates":[15],"region-based":[17],"reward":[18,41],"assignment":[19,27],"being":[20],"used":[21],"to":[22,34,65,70,79],"solve":[23],"structural":[25],"credit":[26],"problem":[28],"and":[29,61,112],"convex":[31],"clustering":[32],"approach":[33],"find":[35],"region":[37],"with":[38,99],"same":[40],"attribution":[42],"property.":[43],"Our":[44],"learning":[45],"can":[47],"estimate":[48],"current":[50],"Q-value":[51],"an":[53],"arbitrarily":[54],"given":[55],"by":[57],"using":[58],"effect":[59],"functions,":[60],"has":[62],"ability":[64],"learn":[66],"its":[67],"actions":[68],"similar":[69],"that":[71],"Q-learning.":[73],"Thus,":[74],"our":[75,91],"enables":[77],"robots":[78],"move":[80],"smoothly":[81],"in":[82],"real":[84],"environment.":[85],"To":[86],"show":[87],"validity":[89],"method,":[92],"proposed":[94],"compared":[98],"conventional":[100],"through":[103],"simple":[105],"two":[106],"dimensional":[107],"free":[108],"navigation":[110],"problem,":[111],"visual":[113],"tracking":[114],"simulation":[115],"results":[116],"involving":[117],"2-DOF":[119],"SCARA":[120],"robot":[121],"are":[122],"also":[123],"presented.":[124]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1654131902","counts_by_year":[{"year":2019,"cited_by_count":1}],"updated_date":"2025-04-19T10:57:50.580546","created_date":"2016-06-24"}