{"id":"https://openalex.org/W4406418770","doi":"https://doi.org/10.1007/s40747-024-01772-x","title":"Preference learning based deep reinforcement learning for flexible job shop scheduling problem","display_name":"Preference learning based deep reinforcement learning for flexible job shop scheduling problem","publication_year":2025,"publication_date":"2025-01-15","ids":{"openalex":"https://openalex.org/W4406418770","doi":"https://doi.org/10.1007/s40747-024-01772-x"},"language":"en","primary_location":{"id":"doi:10.1007/s40747-024-01772-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-024-01772-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01772-x.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01772-x.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014519178","display_name":"Xinning Liu","orcid":"https://orcid.org/0009-0003-4032-1976"},"institutions":[{"id":"https://openalex.org/I4210131997","display_name":"Dalian Neusoft University of Information","ror":"https://ror.org/0304ty515","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210131997"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xinning Liu","raw_affiliation_strings":["School of Computer and Software, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Software, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China","institution_ids":["https://openalex.org/I4210131997"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090216201","display_name":"Han\u2010Xiong Li","orcid":"https://orcid.org/0000-0002-0707-5940"},"institutions":[{"id":"https://openalex.org/I4210131997","display_name":"Dalian Neusoft University of Information","ror":"https://ror.org/0304ty515","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210131997"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Han","raw_affiliation_strings":["School of Computer and Software, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Software, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China","institution_ids":["https://openalex.org/I4210131997"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100306027","display_name":"Ling Kang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210131997","display_name":"Dalian Neusoft University of Information","ror":"https://ror.org/0304ty515","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210131997"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ling Kang","raw_affiliation_strings":["Neusoft Research Institute, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"Neusoft Research Institute, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China","institution_ids":["https://openalex.org/I4210131997"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101522666","display_name":"Jiannan Liu","orcid":"https://orcid.org/0000-0002-2083-4657"},"institutions":[{"id":"https://openalex.org/I4210131997","display_name":"Dalian Neusoft University of Information","ror":"https://ror.org/0304ty515","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210131997"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiannan Liu","raw_affiliation_strings":["School of Computer and Software, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Software, Dalian Neusoft University of Information, Dalian, 116023, Liaoning, China","institution_ids":["https://openalex.org/I4210131997"]}]},{"author_position":"last","author":{"id":null,"display_name":"Huadong Miao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huadong Miao","raw_affiliation_strings":["SNOW China (Beijing) Co. Ltd., Dalian Branch, Dalian, 116023, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"SNOW China (Beijing) Co. Ltd., Dalian Branch, Dalian, 116023, Liaoning, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5014519178"],"corresponding_institution_ids":["https://openalex.org/I4210131997"],"apc_list":{"value":1320,"currency":"GBP","value_usd":1619},"apc_paid":{"value":1320,"currency":"GBP","value_usd":1619},"fwci":9.0471,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.97427988,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"11","issue":"2","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11814","display_name":"Advanced Manufacturing and Logistics Optimization","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12782","display_name":"Assembly Line Balancing Optimization","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6846022605895996},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5778292417526245},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.555491030216217},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4891403019428253},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4833345115184784},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46383747458457947},{"id":"https://openalex.org/keywords/job-shop-scheduling","display_name":"Job shop scheduling","score":0.46282583475112915},{"id":"https://openalex.org/keywords/computational-intelligence","display_name":"Computational intelligence","score":0.4572978913784027},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.39115676283836365},{"id":"https://openalex.org/keywords/industrial-engineering","display_name":"Industrial engineering","score":0.35262274742126465},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.24800699949264526},{"id":"https://openalex.org/keywords/operations-management","display_name":"Operations management","score":0.22934624552726746},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.21601828932762146},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.1396472454071045},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.12818485498428345},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.10096833109855652}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6846022605895996},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5778292417526245},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.555491030216217},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4891403019428253},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4833345115184784},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46383747458457947},{"id":"https://openalex.org/C55416958","wikidata":"https://www.wikidata.org/wiki/Q6206757","display_name":"Job shop scheduling","level":3,"score":0.46282583475112915},{"id":"https://openalex.org/C139502532","wikidata":"https://www.wikidata.org/wiki/Q1122090","display_name":"Computational intelligence","level":2,"score":0.4572978913784027},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.39115676283836365},{"id":"https://openalex.org/C13736549","wikidata":"https://www.wikidata.org/wiki/Q4489420","display_name":"Industrial engineering","level":1,"score":0.35262274742126465},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.24800699949264526},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.22934624552726746},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.21601828932762146},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.1396472454071045},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.12818485498428345},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.10096833109855652},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s40747-024-01772-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-024-01772-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01772-x.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:4d4b96dc2f8646fa95020a2fad6cda40","is_oa":true,"landing_page_url":"https://doaj.org/article/4d4b96dc2f8646fa95020a2fad6cda40","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Complex & Intelligent Systems, Vol 11, Iss 2, Pp 1-23 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s40747-024-01772-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-024-01772-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01772-x.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4406418770.pdf"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W1560042744","https://openalex.org/W1588382077","https://openalex.org/W1970176495","https://openalex.org/W1999445878","https://openalex.org/W2002692271","https://openalex.org/W2014034914","https://openalex.org/W2024085737","https://openalex.org/W2026541511","https://openalex.org/W2076716919","https://openalex.org/W2145079270","https://openalex.org/W2156391157","https://openalex.org/W2157846217","https://openalex.org/W2761608996","https://openalex.org/W2798885736","https://openalex.org/W2949676527","https://openalex.org/W3002239905","https://openalex.org/W3173097263","https://openalex.org/W3183714391","https://openalex.org/W3194871405","https://openalex.org/W3209424396","https://openalex.org/W3210972560","https://openalex.org/W4210876519","https://openalex.org/W4214717370","https://openalex.org/W4282946405","https://openalex.org/W4285024875","https://openalex.org/W4285130537","https://openalex.org/W4304481271","https://openalex.org/W4304692597","https://openalex.org/W4308487886","https://openalex.org/W4386472940","https://openalex.org/W4387918017","https://openalex.org/W4388281316","https://openalex.org/W4389802953","https://openalex.org/W4390368000","https://openalex.org/W4391450140","https://openalex.org/W4393906168","https://openalex.org/W4394573533","https://openalex.org/W4397293298","https://openalex.org/W4401890413","https://openalex.org/W4402493089","https://openalex.org/W4402597514","https://openalex.org/W6600599538"],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"Abstract":[0],"The":[1,206],"flexible":[2],"job":[3],"shop":[4],"scheduling":[5,31,166,182],"problem":[6],"(FJSP)":[7],"holds":[8],"significant":[9],"importance":[10],"in":[11,40,201,217],"both":[12,41],"theoretical":[13],"research":[14],"and":[15,21,28,43,63,117,132,173,184],"practical":[16],"applications.":[17],"Given":[18],"the":[19,26,58,90,124,136,145,148,211,218],"complexity":[20],"diversity":[22],"of":[23,30,38,60,147,158,213],"FJSP,":[24],"improving":[25,130],"generalization":[27],"quality":[29],"methods":[32],"has":[33],"become":[34],"a":[35,51,72,98],"hot":[36],"topic":[37],"interest":[39],"industry":[42],"academia.":[44],"To":[45],"address":[46],"this,":[47],"this":[48],"paper":[49],"proposes":[50],"Preference-Based":[52],"Mask-PPO":[53],"(PBMP)":[54],"algorithm,":[55],"which":[56],"leverages":[57],"strengths":[59],"preference":[61,77,149,192],"learning":[62,78,177,193,203],"invalid":[64],"action":[65,125],"masking":[66],"to":[67,81,112,143,195],"optimize":[68],"FJSP":[69,155],"solutions.":[70],"First,":[71],"reward":[73,83,94,199],"predictor":[74],"based":[75],"on":[76,154],"is":[79,103,110,141],"designed":[80],"model":[82],"prediction":[84],"by":[85],"comparing":[86],"random":[87],"fragments,":[88],"eliminating":[89],"need":[91],"for":[92,204],"complex":[93],"function":[95],"design.":[96],"Second,":[97],"novel":[99],"intelligent":[100],"switching":[101],"mechanism":[102,200],"introduced,":[104],"where":[105],"proximal":[106,119],"policy":[107,120],"optimization":[108,121],"(PPO)":[109],"employed":[111],"enhance":[113],"exploration":[114],"during":[115,127],"sampling,":[116],"masked":[118],"(Mask-PPO)":[122],"refines":[123],"space":[126],"training,":[128],"significantly":[129],"efficiency":[131],"solution":[133],"quality.":[134],"Furthermore,":[135],"Pearson":[137],"correlation":[138],"coefficient":[139],"(PCC)":[140],"used":[142],"evaluate":[144],"performance":[146,222],"model.":[150],"Finally,":[151],"comparative":[152],"experiments":[153],"benchmark":[156],"instances":[157],"varying":[159],"sizes":[160],"demonstrate":[161],"that":[162],"PBMP":[163,219],"outperforms":[164],"traditional":[165],"strategies":[167],"such":[168],"as":[169],"dispatching":[170],"rules,":[171],"OR-Tools,":[172],"other":[174],"deep":[175],"reinforcement":[176,202],"(DRL)":[178],"algorithms,":[179],"achieving":[180],"superior":[181],"policies":[183],"faster":[185],"convergence.":[186],"Even":[187],"with":[188],"increasing":[189],"instance":[190],"sizes,":[191],"proves":[194],"be":[196],"an":[197],"effective":[198],"FJSP.":[205],"ablation":[207],"study":[208],"further":[209],"highlights":[210],"advantages":[212],"each":[214],"key":[215],"component":[216],"algorithm":[220],"across":[221],"metrics.":[223]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
