{"id":"https://openalex.org/W4413318781","doi":"https://doi.org/10.1109/tmc.2025.3600533","title":"$\\pi$-eLight: Learning Interpretable Programmatic Policies for Effective Traffic Signal Control","display_name":"$\\pi$-eLight: Learning Interpretable Programmatic Policies for Effective Traffic Signal Control","publication_year":2025,"publication_date":"2025-08-19","ids":{"openalex":"https://openalex.org/W4413318781","doi":"https://doi.org/10.1109/tmc.2025.3600533"},"language":"en","primary_location":{"id":"doi:10.1109/tmc.2025.3600533","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3600533","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014673381","display_name":"Yin Gu","orcid":"https://orcid.org/0000-0002-6734-9085"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yin Gu","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China","State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Wangjiang West Road, Hefei, Anhui, China"],"raw_orcid":"https://orcid.org/0000-0002-6734-9085","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Wangjiang West Road, Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Kai Zhang","orcid":"https://orcid.org/0000-0001-5335-2470"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Zhang","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China","State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Wangjiang West Road, Hefei, Anhui, China"],"raw_orcid":"https://orcid.org/0000-0001-5335-2470","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Wangjiang West Road, Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qi Liu","orcid":"https://orcid.org/0000-0001-6956-5550"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Liu","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China","State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Wangjiang West Road, Hefei, Anhui, China"],"raw_orcid":"https://orcid.org/0000-0001-6956-5550","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Wangjiang West Road, Hefei, Anhui, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004107420","display_name":"Haojie Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haojie Yuan","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China","University of Science and Technology of China, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"University of Science and Technology of China, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100767610","display_name":"Runlong Yu","orcid":"https://orcid.org/0000-0003-4080-2377"},"institutions":[{"id":"https://openalex.org/I170201317","display_name":"University of Pittsburgh","ror":"https://ror.org/01an3r305","country_code":"US","type":"education","lineage":["https://openalex.org/I170201317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Runlong Yu","raw_affiliation_strings":["Department of Computer Science, University of Pittsburgh, Pittsburgh, PA, USA","Department of Computer Science, the University of Pittsburgh, USA"],"raw_orcid":"https://orcid.org/0000-0003-4080-2377","affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Pittsburgh, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I170201317"]},{"raw_affiliation_string":"Department of Computer Science, the University of Pittsburgh, USA","institution_ids":["https://openalex.org/I170201317"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5014673381"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21622076,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"25","issue":"1","first_page":"1122","last_page":"1136"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9625999927520752,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11344","display_name":"Traffic Prediction and Management Techniques","score":0.9625999927520752,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.771996796131134},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7345250844955444},{"id":"https://openalex.org/keywords/traffic-signal","display_name":"Traffic signal","score":0.5118424296379089},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.46787071228027344},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.4535851776599884},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44507843255996704},{"id":"https://openalex.org/keywords/signal-processing","display_name":"Signal processing","score":0.43714362382888794},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3540504574775696},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.20163217186927795},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.17609041929244995},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09002122282981873}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.771996796131134},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7345250844955444},{"id":"https://openalex.org/C2987419075","wikidata":"https://www.wikidata.org/wiki/Q8004","display_name":"Traffic signal","level":2,"score":0.5118424296379089},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.46787071228027344},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.4535851776599884},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44507843255996704},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.43714362382888794},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3540504574775696},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.20163217186927795},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.17609041929244995},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09002122282981873},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmc.2025.3600533","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3600533","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3552964096","display_name":null,"funder_award_id":"62406303","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4715534059","display_name":null,"funder_award_id":"2308085MG226","funder_id":"https://openalex.org/F4320334897","funder_display_name":"Natural Science Foundation of Anhui Province"},{"id":"https://openalex.org/G487329743","display_name":null,"funder_award_id":"62525606","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5599671648","display_name":null,"funder_award_id":"2308085QF229","funder_id":"https://openalex.org/F4320334897","funder_display_name":"Natural Science Foundation of Anhui Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334897","display_name":"Natural Science Foundation of Anhui Province","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W5525483","https://openalex.org/W1516835682","https://openalex.org/W1625390266","https://openalex.org/W1714211023","https://openalex.org/W2031530760","https://openalex.org/W2145339207","https://openalex.org/W2766447205","https://openalex.org/W2809148419","https://openalex.org/W2945976633","https://openalex.org/W2945991855","https://openalex.org/W2963027910","https://openalex.org/W2983178256","https://openalex.org/W2988973041","https://openalex.org/W2996811470","https://openalex.org/W2998187693","https://openalex.org/W2998332605","https://openalex.org/W3034604283","https://openalex.org/W3086530824","https://openalex.org/W3096739060","https://openalex.org/W3123082711","https://openalex.org/W4249184314","https://openalex.org/W4283787646","https://openalex.org/W4285601936","https://openalex.org/W4302010773","https://openalex.org/W4313555308","https://openalex.org/W4378830682","https://openalex.org/W4384916665","https://openalex.org/W4388624373","https://openalex.org/W4388722291","https://openalex.org/W4393161217","https://openalex.org/W4393241349","https://openalex.org/W4394963598","https://openalex.org/W4398188072","https://openalex.org/W4400412709","https://openalex.org/W4402892022","https://openalex.org/W4409158145"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4367838498","https://openalex.org/W2393348402","https://openalex.org/W4293167677","https://openalex.org/W2242021741","https://openalex.org/W2377015873","https://openalex.org/W2605253768","https://openalex.org/W2392201083"],"abstract_inverted_index":{"The":[0],"recent":[1],"advancements":[2],"in":[3,170,192],"Deep":[4],"Reinforcement":[5],"Learning":[6],"(DRL)":[7],"have":[8],"significantly":[9],"improved":[10],"the":[11,35,51,61,71,83,92,128,167,196],"performance":[12],"of":[13,74,85],"adaptive":[14],"Traffic":[15],"Signal":[16],"Control":[17],"(TSC).":[18],"However,":[19],"DRL":[20,52],"policies":[21,37,63,199],"are":[22,42],"typically":[23],"represented":[24],"by":[25],"over-parameterized":[26],"neural":[27],"networks,":[28],"which":[29],"function":[30],"as":[31,127],"black-box":[32],"models.":[33],"Consequently,":[34],"learned":[36,62,197],"often":[38],"lack":[39],"interpretability":[40],"and":[41,148],"challenging":[43],"to":[44,59,114,165],"deploy":[45],"on":[46,204],"resource-constrained":[47],"edge":[48,205],"hardware.":[49],"Moreover,":[50,195],"methods":[53],"frequently":[54],"exhibit":[55],"poor":[56],"generalization,":[57],"struggling":[58],"transfer":[60],"across":[64,190],"different":[65,193],"geographical":[66],"regions.":[67],"These":[68],"limitations":[69],"hinder":[70],"real-world":[72,213],"applicability":[73],"learning-based":[75],"approaches.":[76],"To":[77],"address":[78],"these":[79],"issues,":[80],"we":[81,120,137,158],"suggest":[82],"use":[84],"an":[86,123],"inherently":[87],"interpretable":[88,146],"program":[89,125,169],"for":[90,101,144,151],"representing":[91],"control":[93,105,129],"policy.":[94],"We":[95],"present":[96],"Programmatic":[97],"Interpretable":[98],"reinforcement":[99],"learning":[100],"effective":[102,124],"traffic":[103],"signal":[104],"(<inline-formula":[106],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[107,179],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[108,180],"notation=\"LaTeX\">$\\pi$</tex-math></inline-formula>-eLight),":[109],"a":[110,139,171],"new":[111],"approach":[112],"designed":[113],"autonomously":[115],"discover":[116],"non-differentiable":[117],"programs.":[118],"Specifically,":[119],"first":[121],"define":[122],"framework":[126],"policy,":[130],"where":[131],"certain":[132],"components":[133],"remain":[134],"learnable.":[135],"Next,":[136],"introduce":[138],"Domain":[140],"Specific":[141],"Language":[142],"(DSL)":[143],"constructing":[145],"programs":[147,153],"transformation":[149],"rules":[150],"generating":[152],"with":[154,207],"hierarchical":[155],"structures.":[156],"Last,":[157],"utilize":[159],"Monte":[160],"Carlo":[161],"Tree":[162],"Search":[163],"(MCTS)":[164],"find":[166],"optimal":[168],"discrete":[172],"space.":[173],"Extensive":[174],"experiments":[175],"demonstrate":[176],"that":[177],"<inline-formula":[178],"notation=\"LaTeX\">$\\pi$</tex-math></inline-formula>-eLight":[181],"consistently":[182],"outperforms":[183],"DRL-based":[184],"baselines":[185],"while":[186],"exhibiting":[187],"superior":[188],"generalization":[189],"intersections":[191],"cities.":[194],"programmatic":[198],"can":[200],"be":[201],"directly":[202],"deployed":[203],"devices":[206],"minimal":[208],"computational":[209],"resources,":[210],"further":[211],"enhancing":[212],"applicability.":[214]},"counts_by_year":[],"updated_date":"2025-12-04T23:47:47.292601","created_date":"2025-10-10T00:00:00"}
