{"id":"https://openalex.org/W4403123027","doi":"https://doi.org/10.1109/tii.2024.3423440","title":"Controlling Partially Observed Industrial System Based on Offline Reinforcement Learning\u2014A Case Study of Paste Thickener","display_name":"Controlling Partially Observed Industrial System Based on Offline Reinforcement Learning\u2014A Case Study of Paste Thickener","publication_year":2024,"publication_date":"2024-10-04","ids":{"openalex":"https://openalex.org/W4403123027","doi":"https://doi.org/10.1109/tii.2024.3423440"},"language":"en","primary_location":{"id":"doi:10.1109/tii.2024.3423440","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tii.2024.3423440","pdf_url":null,"source":{"id":"https://openalex.org/S184777250","display_name":"IEEE Transactions on Industrial Informatics","issn_l":"1551-3203","issn":["1551-3203","1941-0050"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Industrial Informatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041883391","display_name":"Zhaolin Yuan","orcid":"https://orcid.org/0000-0001-5829-8952"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhaolin Yuan","raw_affiliation_strings":["Institute of Artificial Intelligence, University of Science and Technology Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035164440","display_name":"Z.Y. Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"ZiXuan Zhang","raw_affiliation_strings":["Institute of Artificial Intelligence, University of Science and Technology Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016410675","display_name":"Xiaorui Li","orcid":"https://orcid.org/0000-0001-5163-3797"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaorui Li","raw_affiliation_strings":["Institute of Artificial Intelligence, University of Science and Technology Beijing, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011048472","display_name":"Yunduan Cui","orcid":"https://orcid.org/0000-0001-5539-4260"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunduan Cui","raw_affiliation_strings":["Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institute of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068624653","display_name":"Ming Li","orcid":"https://orcid.org/0000-0003-4119-7340"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Ming Li","raw_affiliation_strings":["Department of Industrial and Systems Engineering, Research Institute for Advanced Manufacturing, Research Centre for Digital Transformation of Tourism, The Hong Kong Polytechnic University, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Industrial and Systems Engineering, Research Institute for Advanced Manufacturing, Research Centre for Digital Transformation of Tourism, The Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009624071","display_name":"Xiaojuan Ban","orcid":"https://orcid.org/0000-0001-9142-3276"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojuan Ban","raw_affiliation_strings":["Beijing Advanced Innovation Center for Materials Genome Engineering, School of Intelligence Science and Technology, Key Laboratory of Intelligent Bionic Unmanned Systems, Ministry of Education, University of Science and Technology Beijing and Institute of Materials Intelligent Technology, Liaoning Academy of Materials, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Beijing Advanced Innovation Center for Materials Genome Engineering, School of Intelligence Science and Technology, Key Laboratory of Intelligent Bionic Unmanned Systems, Ministry of Education, University of Science and Technology Beijing and Institute of Materials Intelligent Technology, Liaoning Academy of Materials, Shenyang, China","institution_ids":["https://openalex.org/I92403157"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5041883391"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":3.5511,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.93330686,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"21","issue":"1","first_page":"49","last_page":"59"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14225","display_name":"Advanced Sensor and Control Systems","score":0.17270000278949738,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14225","display_name":"Advanced Sensor and Control Systems","score":0.17270000278949738,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.6049017906188965},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.534002423286438},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4372463822364807},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.24658456444740295},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2248172163963318},{"id":"https://openalex.org/keywords/composite-material","display_name":"Composite material","score":0.19212308526039124}],"concepts":[{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.6049017906188965},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.534002423286438},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4372463822364807},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.24658456444740295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2248172163963318},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.19212308526039124}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tii.2024.3423440","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tii.2024.3423440","pdf_url":null,"source":{"id":"https://openalex.org/S184777250","display_name":"IEEE Transactions on Industrial Informatics","issn_l":"1551-3203","issn":["1551-3203","1941-0050"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Industrial Informatics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1093189910","display_name":null,"funder_award_id":"62376025","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2756798008","display_name":null,"funder_award_id":"62306032","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2819759403","display_name":null,"funder_award_id":"2022A1515110350","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G5292391546","display_name":null,"funder_award_id":"62332017","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2077447451","https://openalex.org/W2145339207","https://openalex.org/W2520847632","https://openalex.org/W2583461487","https://openalex.org/W2754615637","https://openalex.org/W2762709466","https://openalex.org/W2901625717","https://openalex.org/W2962917939","https://openalex.org/W2988984361","https://openalex.org/W2993272697","https://openalex.org/W3022566517","https://openalex.org/W3127561923","https://openalex.org/W3131674817","https://openalex.org/W3158384428","https://openalex.org/W3197950013","https://openalex.org/W4206497039","https://openalex.org/W4213377513","https://openalex.org/W4221034994","https://openalex.org/W4296913567","https://openalex.org/W4312281895","https://openalex.org/W4368232742","https://openalex.org/W4375929150","https://openalex.org/W4382202915","https://openalex.org/W4386285856","https://openalex.org/W6617744952","https://openalex.org/W6684205842","https://openalex.org/W6757469721","https://openalex.org/W6790767801","https://openalex.org/W6884732130"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588"],"abstract_inverted_index":{"In":[0,29,86,119],"the":[1,7,19,40,44,67,70,75,95,99,108,116,128,137,141,199,203,208],"field":[2],"of":[3,18,69,88,98,140,211,220],"mineral":[4],"processing,":[5],"controlling":[6,36,127,165],"paste":[8,188,224],"thickener":[9,189,225],"is":[10],"a":[11,104,123,146,180,185,191,243,247],"highly":[12],"challenging":[13],"and":[14,25,144,157,173,184,205],"critical":[15,124],"task":[16],"because":[17],"high":[20],"complexity,":[21],"incomplete":[22],"observation":[23,132],"space,":[24,133],"excessive":[26],"environmental":[27],"noises.":[28],"this":[30,92,134],"article,":[31],"we":[32],"propose":[33],"an":[34,228],"offline-data-driven":[35],"strategy":[37],"to":[38,54,102,111,121],"optimize":[39],"operational":[41,113],"indices":[42],"in":[43,126,178,190,223,235],"thickening":[45,100,129,142,182],"system":[46,143],"based":[47],"on":[48,60,231,242],"offline":[49,79,89,117,148,240],"reinforcement":[50],"learning":[51],"(RL).":[52],"Compared":[53],"common":[55],"RL":[56,149,241],"methods":[57],"that":[58,198],"rely":[59],"online":[61,84],"interactive":[62],"training,":[63],"our":[64,221],"approach":[65],"ensures":[66],"safety":[68],"production":[71],"process":[72],"by":[73,214],"training":[74],"controller":[76,106,201],"solely":[77],"using":[78],"datasets,":[80],"thereby":[81],"avoiding":[82],"dangerous":[83],"exploration.":[85],"terms":[87],"dataset":[90,244],"collection,":[91],"study":[93],"utilizes":[94],"prior":[96],"knowledge":[97],"mechanism":[101],"design":[103],"proportional\u2013integral\u2013derivative":[105],"as":[107,115],"behavior":[109],"policy":[110,175],"collect":[112],"trajectories":[114],"dataset.":[118],"addition,":[120],"tackle":[122],"issue":[125],"system:":[130],"constrained":[131],"article":[135],"analyzes":[136],"dynamical":[138],"properties":[139],"introduces":[145],"novel":[147],"algorithm,":[150],"temporal":[151],"batch-constrained":[152],"Q-learning":[153],"(TBCQ).":[154],"The":[155,171,194,217],"algorithm":[156],"associated":[158],"model":[159],"framework":[160],"are":[161,176],"specifically":[162],"developed":[163],"for":[164],"partially":[166],"observed":[167],"Markov":[168],"decision":[169],"processes.":[170],"TBCQ":[172],"trained":[174],"evaluated":[177],"both":[179],"simulated":[181],"environment":[183],"real":[186],"industrial":[187,237],"copper":[192],"mine.":[193],"real-world":[195],"experiments":[196],"demonstrate":[197],"proposed":[200],"outperforms":[202],"baselines":[204],"effectively":[206],"reduces":[207],"tracking":[209],"error":[210],"underflow":[212],"concentration":[213],"over":[215],"12%.":[216],"successful":[218],"application":[219],"pipeline":[222],"also":[226],"offers":[227],"innovative":[229],"perspective":[230],"addressing":[232],"optimization":[233],"problems":[234],"complex":[236],"systems:":[238],"performing":[239],"sampled":[245],"from":[246],"suboptimal":[248],"policy.":[249]},"counts_by_year":[{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
