{"id":"https://openalex.org/W7125494631","doi":"https://doi.org/10.1145/3790252","title":"A Hybrid Approach of Imitation Learning and Deep Reinforcement Learning with Direct-Effect Update Interval for Elevator Dispatching","display_name":"A Hybrid Approach of Imitation Learning and Deep Reinforcement Learning with Direct-Effect Update Interval for Elevator Dispatching","publication_year":2026,"publication_date":"2026-01-23","ids":{"openalex":"https://openalex.org/W7125494631","doi":"https://doi.org/10.1145/3790252"},"language":"en","primary_location":{"id":"doi:10.1145/3790252","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3790252","pdf_url":null,"source":{"id":"https://openalex.org/S2506189754","display_name":"ACM Transactions on Cyber-Physical Systems","issn_l":"2378-962X","issn":["2378-962X","2378-9638"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Cyber-Physical Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1145/3790252","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044790776","display_name":"Jiansong Wan","orcid":"https://orcid.org/0000-0002-3748-8404"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jiansong Wan","raw_affiliation_strings":["Korea Advanced Institute of Science and Technology, Daejeon, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0002-3748-8404","affiliations":[{"raw_affiliation_string":"Korea Advanced Institute of Science and Technology, Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Kanghoon Lee","orcid":"https://orcid.org/0000-0003-2195-798X"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kanghoon Lee","raw_affiliation_strings":["Korea Advanced Institute of Science and Technology, Daejeon, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0003-2195-798X","affiliations":[{"raw_affiliation_string":"Korea Advanced Institute of Science and Technology, Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064587334","display_name":"Hayong Shin","orcid":"https://orcid.org/0000-0002-5161-661X"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hayong Shin","raw_affiliation_strings":["Korea Advanced Institute of Science and Technology, Daejeon, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0002-5161-661X","affiliations":[{"raw_affiliation_string":"Korea Advanced Institute of Science and Technology, Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5044790776"],"corresponding_institution_ids":["https://openalex.org/I157485424"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1108475,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"10","issue":"3","first_page":"1","last_page":"19"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14011","display_name":"Elevator Systems and Control","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12206","display_name":"Vibration and Dynamic Analysis","score":0.0007999999797903001,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.00039999998989515007,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9031999707221985},{"id":"https://openalex.org/keywords/elevator","display_name":"Elevator","score":0.6748999953269958},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6700999736785889},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.6284000277519226},{"id":"https://openalex.org/keywords/interval","display_name":"Interval (graph theory)","score":0.5209000110626221},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4767000079154968},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.453000009059906}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9031999707221985},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6869999766349792},{"id":"https://openalex.org/C147021018","wikidata":"https://www.wikidata.org/wiki/Q252451","display_name":"Elevator","level":2,"score":0.6748999953269958},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6700999736785889},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.6284000277519226},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5648000240325928},{"id":"https://openalex.org/C2778067643","wikidata":"https://www.wikidata.org/wiki/Q166507","display_name":"Interval (graph theory)","level":2,"score":0.5209000110626221},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4767000079154968},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.453000009059906},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4327000081539154},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3889999985694885},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3253999948501587},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3149000108242035},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.29600000381469727},{"id":"https://openalex.org/C112758219","wikidata":"https://www.wikidata.org/wiki/Q16038819","display_name":"Duration (music)","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C139002025","wikidata":"https://www.wikidata.org/wiki/Q3001212","display_name":"Lift (data mining)","level":2,"score":0.2883000075817108},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.2833999991416931},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.27320000529289246}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3790252","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3790252","pdf_url":null,"source":{"id":"https://openalex.org/S2506189754","display_name":"ACM Transactions on Cyber-Physical Systems","issn_l":"2378-962X","issn":["2378-962X","2378-9638"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Cyber-Physical Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3790252","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3790252","pdf_url":null,"source":{"id":"https://openalex.org/S2506189754","display_name":"ACM Transactions on Cyber-Physical Systems","issn_l":"2378-962X","issn":["2378-962X","2378-9638"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Cyber-Physical Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2062353690","https://openalex.org/W2082373829","https://openalex.org/W2121099957","https://openalex.org/W2274680267","https://openalex.org/W2525813444","https://openalex.org/W2604382266","https://openalex.org/W3049468855","https://openalex.org/W3133722106","https://openalex.org/W3138984732","https://openalex.org/W3153113933","https://openalex.org/W3154178432","https://openalex.org/W3177457598","https://openalex.org/W4200067854","https://openalex.org/W4307234290","https://openalex.org/W4319737028"],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"increase":[2],"in":[3,23,187],"high-rise":[4],"building":[5],"construction":[6],"has":[7,143],"intensified":[8],"the":[9,19,30,39,63,69,73,83,96,99,126,134,154,166,170,175,180,194],"need":[10],"for":[11,86],"efficient":[12],"elevator":[13,20,24,65,87],"system":[14],"operations.":[15],"This":[16],"article":[17],"addresses":[18],"dispatching":[21,66],"problem":[22,31],"group":[25],"control":[26],"systems.":[27],"We":[28],"formulate":[29],"as":[32,163,165,200],"a":[33,76,111,121],"Semi-Markov":[34],"Decision":[35],"Process":[36],"(SMDP),":[37],"defining":[38],"state":[40],"representation,":[41],"action":[42],"space,":[43],"and":[44,56,193],"reward":[45],"function.":[46],"A":[47],"two-phase":[48],"model":[49,182],"is":[50,79,103],"then":[51],"introduced,":[52],"integrating":[53],"imitation":[54,158],"learning":[55,59,116,136,159,177],"deep":[57,114],"reinforcement":[58,115,135,161,176],"techniques":[60],"to":[61,89,146],"derive":[62],"optimal":[64],"policy":[67,77,101,131],"from":[68],"formulated":[70],"SMDP.":[71],"In":[72,95],"first":[74],"phase,":[75,98],"network":[78,102],"pre-trained":[80,100],"by":[81],"estimating":[82],"time":[84,192],"required":[85],"cars":[88],"pick":[90],"up":[91],"assigned":[92],"hall":[93],"requests.":[94],"second":[97],"further":[104],"optimized":[105],"using":[106],"Proximal":[107],"Policy":[108],"Optimization":[109],"(PPO),":[110],"well-known":[112],"policy-based":[113],"method.":[117],"Additionally,":[118],"we":[119],"propose":[120],"novel":[122],"update":[123,172],"interval,":[124,128],"termed":[125],"\u201cdirect-effect\u201d":[127],"which":[129],"improves":[130],"training":[132],"during":[133,174],"phase.":[137,178],"Notably,":[138],"this":[139],"direct-effect":[140,171],"interval":[141,173],"concept":[142],"potential":[144],"applicability":[145],"other":[147],"multi-resource":[148],"scheduling":[149],"problems.":[150],"Empirical":[151],"experiments":[152],"demonstrate":[153],"advantages":[155],"of":[156,168,189,196],"incorporating":[157],"before":[160],"learning,":[162],"well":[164],"effectiveness":[167],"employing":[169],"Furthermore,":[179],"proposed":[181],"outperforms":[183],"various":[184],"benchmark":[185],"rules":[186],"terms":[188],"average":[190],"waiting":[191,198],"distribution":[195],"long":[197],"times,":[199],"validated":[201],"across":[202],"four":[203],"traffic":[204],"patterns.":[205]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2026-01-24T00:00:00"}
