{"id":"https://openalex.org/W4416965655","doi":"https://doi.org/10.1109/tase.2025.3639576","title":"Game Theory-Based Production-Maintenance Collaborative Scheduling Using Imitation-Enhanced Alternating-Training Reinforcement Learning","display_name":"Game Theory-Based Production-Maintenance Collaborative Scheduling Using Imitation-Enhanced Alternating-Training Reinforcement Learning","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W4416965655","doi":"https://doi.org/10.1109/tase.2025.3639576"},"language":null,"primary_location":{"id":"doi:10.1109/tase.2025.3639576","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3639576","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058918143","display_name":"Jiaxuan Shi","orcid":"https://orcid.org/0009-0004-0027-7226"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiaxuan Shi","raw_affiliation_strings":["Shanghai Research Institute for Intelligent Autonomous Systems, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Research Institute for Intelligent Autonomous Systems, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103108404","display_name":"Fei Qiao","orcid":"https://orcid.org/0000-0002-1513-8753"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Qiao","raw_affiliation_strings":["College of Electronics and Information Engineering, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"College of Electronics and Information Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061363418","display_name":"Juan Liu","orcid":"https://orcid.org/0000-0001-8934-2127"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Juan Liu","raw_affiliation_strings":["College of Electronics and Information Engineering, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"College of Electronics and Information Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051315321","display_name":"Yumin Ma","orcid":"https://orcid.org/0000-0001-9271-3363"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yumin Ma","raw_affiliation_strings":["College of Electronics and Information Engineering, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"College of Electronics and Information Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5058918143"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.52536056,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"23","issue":null,"first_page":"1284","last_page":"1300"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12782","display_name":"Assembly Line Balancing Optimization","score":0.3549000024795532,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12782","display_name":"Assembly Line Balancing Optimization","score":0.3549000024795532,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.3093000054359436,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12177","display_name":"Resource-Constrained Project Scheduling","score":0.06019999831914902,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7785000205039978},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5857999920845032},{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.5760999917984009},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.46320000290870667},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.4343000054359436},{"id":"https://openalex.org/keywords/job-shop-scheduling","display_name":"Job shop scheduling","score":0.39430001378059387},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.3725000023841858},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.35339999198913574}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7785000205039978},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.689300000667572},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5857999920845032},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.5760999917984009},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.46320000290870667},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.4343000054359436},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40470001101493835},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.39559999108314514},{"id":"https://openalex.org/C55416958","wikidata":"https://www.wikidata.org/wiki/Q6206757","display_name":"Job shop scheduling","level":3,"score":0.39430001378059387},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.3725000023841858},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.35339999198913574},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.32850000262260437},{"id":"https://openalex.org/C47175762","wikidata":"https://www.wikidata.org/wiki/Q13422573","display_name":"Non-cooperative game","level":3,"score":0.32170000672340393},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.3116999864578247},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.3089999854564667},{"id":"https://openalex.org/C32407928","wikidata":"https://www.wikidata.org/wiki/Q2733833","display_name":"Best response","level":3,"score":0.30379998683929443},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.2770000100135803},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2705000042915344},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.26260000467300415},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2623000144958496},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C554579003","wikidata":"https://www.wikidata.org/wiki/Q474157","display_name":"Collaborative software","level":2,"score":0.2549999952316284},{"id":"https://openalex.org/C68781425","wikidata":"https://www.wikidata.org/wiki/Q2052203","display_name":"Multi-objective optimization","level":2,"score":0.25360000133514404},{"id":"https://openalex.org/C153517567","wikidata":"https://www.wikidata.org/wiki/Q26090","display_name":"Mechanism design","level":2,"score":0.25040000677108765},{"id":"https://openalex.org/C194387892","wikidata":"https://www.wikidata.org/wiki/Q1747770","display_name":"Stochastic optimization","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2025.3639576","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3639576","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W2023249309","https://openalex.org/W2067050450","https://openalex.org/W2513678011","https://openalex.org/W2889787818","https://openalex.org/W2904246096","https://openalex.org/W2979899262","https://openalex.org/W2996786783","https://openalex.org/W3007831445","https://openalex.org/W3120813239","https://openalex.org/W3123950820","https://openalex.org/W3173943138","https://openalex.org/W3191327624","https://openalex.org/W3194871405","https://openalex.org/W3211131134","https://openalex.org/W4220966002","https://openalex.org/W4220994423","https://openalex.org/W4221116989","https://openalex.org/W4234761190","https://openalex.org/W4285262488","https://openalex.org/W4285499526","https://openalex.org/W4293023550","https://openalex.org/W4303986743","https://openalex.org/W4312143595","https://openalex.org/W4313681148","https://openalex.org/W4367301423","https://openalex.org/W4379928525","https://openalex.org/W4382119654","https://openalex.org/W4385325797","https://openalex.org/W4385338914","https://openalex.org/W4386706959","https://openalex.org/W4387046648","https://openalex.org/W4387967184","https://openalex.org/W4388240372","https://openalex.org/W4388579659","https://openalex.org/W4389037345","https://openalex.org/W4393146695","https://openalex.org/W4393371729","https://openalex.org/W4400086563","https://openalex.org/W4403628545","https://openalex.org/W4404593169","https://openalex.org/W4404809728","https://openalex.org/W4408915573","https://openalex.org/W4414396687"],"related_works":[],"abstract_inverted_index":{"The":[0,164],"collaborative":[1,59],"organization":[2],"of":[3,38,44,101,130,166],"production":[4],"scheduling":[5,60],"and":[6,41,74,134,154],"machine":[7],"maintenance":[8],"is":[9,114,124,170],"crucial":[10],"for":[11,97],"achieving":[12,156],"effective":[13],"manufacturing.":[14],"However,":[15],"since":[16],"these":[17],"two":[18,69,131,143],"activities":[19,70,79],"are":[20,71,80,139],"typically":[21],"managed":[22],"by":[23,68],"different":[24],"self-interested":[25],"managers":[26],"with":[27],"distinct":[28],"optimization":[29,43],"needs":[30],"in":[31],"practice,":[32],"their":[33],"collaboration":[34],"faces":[35],"the":[36,63,75,90,94,99,128,147,157,167],"challenge":[37],"simultaneous":[39],"consideration":[40],"balanced":[42],"both":[45,102],"parties\u2019":[46],"interests.":[47],"To":[48,104],"this":[49,51,106,117],"end,":[50],"study":[52],"investigates":[53],"a":[54,83],"novel":[55],"game":[56,91,132],"theory-based":[57],"production-maintenance":[58],"problem,":[61,107],"wherein":[62],"typical":[64],"objectives":[65],"individually":[66],"concerned":[67],"explicitly":[72],"considered":[73],"decision":[76],"interactions":[77],"between":[78],"modeled":[81],"as":[82],"non-cooperative":[84],"stochastic":[85],"game.":[86],"Nash":[87,162],"equilibrium":[88],"within":[89],"model":[92],"provides":[93],"ideal":[95],"solution":[96],"balancing":[98],"interests":[100],"parties.":[103],"solve":[105],"an":[108,119,135],"imitation-enhanced":[109],"alternating-training":[110],"reinforcement":[111],"learning":[112,146],"method":[113,169],"presented.":[115],"In":[116],"method,":[118],"imitation":[120],"learning-based":[121],"initialization":[122],"mechanism":[123,138],"designed":[125],"to":[126,141,150,161],"accelerate":[127],"training":[129,137],"agents,":[133],"alternating":[136],"developed":[140],"facilitate":[142],"agents":[144],"efficiently":[145],"optimal":[148],"responses":[149],"each":[151],"other\u2019s":[152],"behaviors":[153],"ultimately":[155],"decisions":[158],"that":[159],"converge":[160],"equilibrium.":[163],"superiority":[165],"proposed":[168],"verified":[171],"through":[172],"comprehensive":[173],"experiments.":[174]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-12-03T00:00:00"}
