{"id":"https://openalex.org/W2991478725","doi":"https://doi.org/10.1109/itsc.2019.8917519","title":"Reinforcement Learning with Explainability for Traffic Signal Control","display_name":"Reinforcement Learning with Explainability for Traffic Signal Control","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2991478725","doi":"https://doi.org/10.1109/itsc.2019.8917519","mag":"2991478725"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc.2019.8917519","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077420826","display_name":"Stefano Rizzo","orcid":"https://orcid.org/0000-0003-3346-3389"},"institutions":[{"id":"https://openalex.org/I4210138380","display_name":"Qatar Cardiovascular Research Center","ror":"https://ror.org/038vyt185","country_code":"QA","type":"healthcare","lineage":["https://openalex.org/I4210138380"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Stefano Giovanni Rizzo","raw_affiliation_strings":["Qatar Computing Research Institute (QCRI), Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute (QCRI), Doha, Qatar","institution_ids":["https://openalex.org/I4210138380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046441501","display_name":"Giovanna Vantini","orcid":null},"institutions":[{"id":"https://openalex.org/I4210138380","display_name":"Qatar Cardiovascular Research Center","ror":"https://ror.org/038vyt185","country_code":"QA","type":"healthcare","lineage":["https://openalex.org/I4210138380"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Giovanna Vantini","raw_affiliation_strings":["Qatar Computing Research Institute (QCRI), Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute (QCRI), Doha, Qatar","institution_ids":["https://openalex.org/I4210138380"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037947876","display_name":"Sanjay Chawla","orcid":"https://orcid.org/0000-0002-8102-2572"},"institutions":[{"id":"https://openalex.org/I4210138380","display_name":"Qatar Cardiovascular Research Center","ror":"https://ror.org/038vyt185","country_code":"QA","type":"healthcare","lineage":["https://openalex.org/I4210138380"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Sanjay Chawla","raw_affiliation_strings":["Qatar Computing Research Institute (QCRI), Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute (QCRI), Doha, Qatar","institution_ids":["https://openalex.org/I4210138380"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.611,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.968471,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":92},"biblio":{"volume":null,"issue":null,"first_page":"3567","last_page":"3572"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9972,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9965,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/roundabout","display_name":"Roundabout","score":0.8837631},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.4281491}],"concepts":[{"id":"https://openalex.org/C109157449","wikidata":"https://www.wikidata.org/wiki/Q7371221","display_name":"Roundabout","level":2,"score":0.8837631},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8363914},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.70088804},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5387396},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.50992405},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.484276},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4610855},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.4281491},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4267842},{"id":"https://openalex.org/C2987419075","wikidata":"https://www.wikidata.org/wiki/Q8004","display_name":"Traffic signal","level":2,"score":0.42162973},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.41866},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.33742866},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18341216},{"id":"https://openalex.org/C22212356","wikidata":"https://www.wikidata.org/wiki/Q775325","display_name":"Transport engineering","level":1,"score":0.17139259},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.13220295},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12433681},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.10607806},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc.2019.8917519","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities","score":0.41}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":25,"referenced_works":["https://openalex.org/W1515851193","https://openalex.org/W1542507415","https://openalex.org/W1639167632","https://openalex.org/W2020070197","https://openalex.org/W2048805856","https://openalex.org/W2072979389","https://openalex.org/W2102099143","https://openalex.org/W2149174281","https://openalex.org/W2163207186","https://openalex.org/W2257979135","https://openalex.org/W2282821441","https://openalex.org/W2384435634","https://openalex.org/W2462310663","https://openalex.org/W2498017881","https://openalex.org/W2548134372","https://openalex.org/W2613020517","https://openalex.org/W2725582697","https://openalex.org/W2797527950","https://openalex.org/W2809148419","https://openalex.org/W2962862931","https://openalex.org/W2963027910","https://openalex.org/W3122002227","https://openalex.org/W33871791","https://openalex.org/W4214717370","https://openalex.org/W4389739628"],"related_works":["https://openalex.org/W3195808870","https://openalex.org/W3169884754","https://openalex.org/W3121910006","https://openalex.org/W3046449118","https://openalex.org/W2943218108","https://openalex.org/W2799340515","https://openalex.org/W2394278401","https://openalex.org/W2353721067","https://openalex.org/W2140594597","https://openalex.org/W2131944147"],"abstract_inverted_index":{"Deep":[0],"reinforcement":[1],"learning":[2],"has":[3],"recently":[4],"provided":[5],"promising":[6],"results":[7,162],"on":[8,95,142,172],"the":[9,22,38,62,75,108,111,116,122,128,135,138,143,148,173,184,188],"traffic":[10,23,40,84,104,185],"light":[11,24],"control":[12],"optimization":[13],"problem,":[14],"by":[15,31,176],"training":[16,90],"neural":[17],"network":[18],"agents":[19,27],"to":[20,49,127,168,182],"select":[21],"phase.":[25],"These":[26],"learn":[28],"complex":[29,67,178],"models":[30],"optimizing":[32],"a":[33,91,96,157,177],"simple":[34],"objective,":[35],"such":[36,72],"as":[37,73],"average":[39],"speed,":[41],"but":[42],"are":[43,55],"considered":[44],"opaque":[45],"when":[46],"it":[47,165],"comes":[48],"explaining":[50],"their":[51],"decisions.":[52],"Nevertheless,":[53],"explanations":[54,171],"required":[56],"in":[57,61,66,74,180],"transferring":[58],"this":[59,87],"technology":[60],"real":[63,103],"world,":[64],"especially":[65],"scenarios":[68],"with":[69,80,99],"nontrivial":[70],"phases,":[71,146],"case":[76],"of":[77,125,137],"signalized":[78,97],"roundabouts":[79],"entry":[81],"and":[82,102,115,119,187],"circulatory":[83],"lights.":[85],"In":[86],"paper,":[88],"after":[89],"Policy":[92],"Gradient":[93],"agent":[94,112,123,144],"roundabout":[98],"11":[100],"phases":[101],"data,":[105],"we":[106,120,133],"analyze":[107],"relation":[109,181],"between":[110],"phase":[113],"preferences":[114],"actual":[117],"traffic,":[118],"assess":[121],"capability":[124],"reacting":[126],"current":[129],"detectors":[130,140],"state.":[131],"Then,":[132],"estimate":[134],"effect":[136],"road":[139],"state":[141],"selected":[145],"through":[147],"SHAP":[149],"model-agnostic":[150],"technique,":[151],"using":[152],"Shapley":[153],"values":[154],"recovered":[155],"from":[156],"linear":[158],"explanation":[159],"model.":[160],"The":[161],"show":[163],"that":[164],"is":[166],"possible":[167],"extract":[169],"meaningful":[170],"decision":[174],"taken":[175],"policy,":[179],"both":[183],"volumes":[186],"lanes":[189],"occupancy.":[190]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2991478725","counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":3}],"updated_date":"2025-04-21T23:31:09.737914","created_date":"2019-12-05"}