{"id":"https://openalex.org/W4289812636","doi":"https://doi.org/10.1109/tits.2022.3193852","title":"Transformer-Based Reinforcement Learning for Pickup and Delivery Problems With Late Penalties","display_name":"Transformer-Based Reinforcement Learning for Pickup and Delivery Problems With Late Penalties","publication_year":2022,"publication_date":"2022-08-04","ids":{"openalex":"https://openalex.org/W4289812636","doi":"https://doi.org/10.1109/tits.2022.3193852"},"language":"en","primary_location":{"id":"doi:10.1109/tits.2022.3193852","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2022.3193852","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058375369","display_name":"Ke Zhang","orcid":"https://orcid.org/0000-0001-7397-5560"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ke Zhang","raw_affiliation_strings":["Department of Civil Engineering, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7397-5560","affiliations":[{"raw_affiliation_string":"Department of Civil Engineering, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103252409","display_name":"Xi Lin","orcid":"https://orcid.org/0000-0001-7137-5406"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xi Lin","raw_affiliation_strings":["Department of Civil Engineering, Tsinghua University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Civil Engineering, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100457416","display_name":"Meng Li","orcid":"https://orcid.org/0000-0001-9494-4552"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Li","raw_affiliation_strings":["Department of Civil Engineering, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9494-4552","affiliations":[{"raw_affiliation_string":"Department of Civil Engineering, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5058375369"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.4884,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.80672543,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"23","issue":"12","first_page":"24649","last_page":"24661"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12546","display_name":"Smart Parking Systems Research","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/2215","display_name":"Building and Construction"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10567","display_name":"Vehicle Routing Optimization Methods","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8322965502738953},{"id":"https://openalex.org/keywords/pickup","display_name":"Pickup","score":0.7497711181640625},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6391599774360657},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5898767113685608},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.46741724014282227},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.45265311002731323},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35997825860977173},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2808312773704529},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.08635741472244263}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8322965502738953},{"id":"https://openalex.org/C2776221269","wikidata":"https://www.wikidata.org/wiki/Q572648","display_name":"Pickup","level":3,"score":0.7497711181640625},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6391599774360657},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5898767113685608},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.46741724014282227},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.45265311002731323},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35997825860977173},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2808312773704529},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.08635741472244263},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2022.3193852","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2022.3193852","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1484665340","https://openalex.org/W1522301498","https://openalex.org/W1601649239","https://openalex.org/W1969261937","https://openalex.org/W1996315642","https://openalex.org/W1999406036","https://openalex.org/W2017462516","https://openalex.org/W2019567064","https://openalex.org/W2045673887","https://openalex.org/W2058405995","https://openalex.org/W2081230102","https://openalex.org/W2082670167","https://openalex.org/W2100711246","https://openalex.org/W2130942839","https://openalex.org/W2146870367","https://openalex.org/W2155027007","https://openalex.org/W2163947723","https://openalex.org/W2194775991","https://openalex.org/W2466673901","https://openalex.org/W2563119939","https://openalex.org/W2805798351","https://openalex.org/W2907833097","https://openalex.org/W2938157874","https://openalex.org/W2951846985","https://openalex.org/W2952332632","https://openalex.org/W2963084599","https://openalex.org/W2986488952","https://openalex.org/W3014845548","https://openalex.org/W3018779742","https://openalex.org/W3040879766","https://openalex.org/W3043239066","https://openalex.org/W3044015199","https://openalex.org/W3109386843","https://openalex.org/W3128933491","https://openalex.org/W3133471011","https://openalex.org/W3190367510","https://openalex.org/W3193590387","https://openalex.org/W3199468096","https://openalex.org/W4295138992","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6679436768","https://openalex.org/W6683204974","https://openalex.org/W6725207838","https://openalex.org/W6730742100","https://openalex.org/W6739901393","https://openalex.org/W6748487558","https://openalex.org/W6758687306","https://openalex.org/W6790709252","https://openalex.org/W6801123346"],"related_works":["https://openalex.org/W2185313546","https://openalex.org/W2185850456","https://openalex.org/W2994962043","https://openalex.org/W2351571732","https://openalex.org/W1496169957","https://openalex.org/W2324305961","https://openalex.org/W2075333697","https://openalex.org/W202150730","https://openalex.org/W1971021931","https://openalex.org/W166444759"],"abstract_inverted_index":{"Pickup":[0],"and":[1,23,34,94,97,133,189],"delivery":[2,95],"problems":[3],"with":[4,101,130,152,185],"late":[5,39],"penalties":[6,40],"can":[7,86,163],"be":[8,164,196],"adopted":[9],"to":[10,44,63,105,109,144,166,195,199],"model":[11,158,176],"a":[12,54,146,168],"wide":[13],"range":[14],"of":[15,21,80,123,142,203],"practical":[16],"situations":[17],"in":[18,182],"the":[19,26,29,38,75,81,88,92,98,117,121,126,138,150,156,174,190,201],"field":[20],"transportation":[22],"logistics.":[24],"However,":[25],"restrictions":[27],"on":[28,113,125,149,160],"multiple":[30],"vehicles\u2019":[31],"service":[32],"sequences":[33],"non-linearity":[35],"caused":[36],"by":[37,60],"make":[41],"it":[42],"time-consuming":[43],"solve":[45],"this":[46,50],"problem.":[47],"To":[48],"overcome":[49],"difficulty,":[51],"we":[52],"propose":[53],"novel":[55],"reinforcement":[56],"learning":[57],"framework":[58],"inspired":[59],"transformer":[61],"architecture":[62],"generate":[64],"tours":[65],"instantly":[66],"after":[67],"offline":[68],"training.":[69],"This":[70],"framework,":[71],"as":[72],"trained":[73],"through":[74],"policy":[76],"gradient":[77],"method,":[78],"consists":[79],"information":[82],"encoder":[83],"process":[84,100],"which":[85],"extract":[87],"coupling":[89],"relationships":[90],"among":[91],"pickup":[93],"customers,":[96],"decoder":[99],"multi-vehicle":[102],"attention":[103],"network":[104],"allocate":[106],"reasonable":[107],"orders":[108],"each":[110],"vehicle.":[111],"Validated":[112],"Sioux":[114],"Falls":[115],"network,":[116],"proposed":[118,175],"method":[119,162],"yields":[120],"improvement":[122],"2.4%-8.0%":[124],"solution":[127,170],"quality":[128],"compared":[129],"Google":[131],"OR-Tools":[132],"several":[134],"heuristic":[135],"algorithms.":[136],"Notably,":[137],"baselines":[139],"require":[140],"dozens":[141],"minutes":[143],"achieve":[145],"lesser":[147],"result":[148],"case":[151],"100":[153],"customers":[154],"while":[155],"well-trained":[157],"based":[159],"our":[161],"deployed":[165],"provide":[167],"high-quality":[169],"within":[171],"seconds.":[172],"Furthermore,":[173],"also":[177],"shows":[178],"good":[179],"generalization":[180],"ability":[181],"different":[183],"scenarios":[184],"various":[186],"scale":[187],"problems,":[188],"obtained":[191],"results":[192],"are":[193],"shown":[194],"quite":[197],"robust":[198],"counter":[200],"fluctuation":[202],"travel":[204],"time.":[205]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
