{"id":"https://openalex.org/W4407247577","doi":"https://doi.org/10.1109/tcds.2025.3540115","title":"Visual Reinforcement Learning Based on Multiview Optimization Aggregation","display_name":"Visual Reinforcement Learning Based on Multiview Optimization Aggregation","publication_year":2025,"publication_date":"2025-02-07","ids":{"openalex":"https://openalex.org/W4407247577","doi":"https://doi.org/10.1109/tcds.2025.3540115"},"language":"en","primary_location":{"id":"doi:10.1109/tcds.2025.3540115","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcds.2025.3540115","pdf_url":null,"source":{"id":"https://openalex.org/S2488537894","display_name":"IEEE Transactions on Cognitive and Developmental Systems","issn_l":"2379-8920","issn":["2379-8920","2379-8939"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive and Developmental Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108064895","display_name":"Xuesong Wang","orcid":"https://orcid.org/0000-0002-5327-1088"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuesong Wang","raw_affiliation_strings":["Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-5327-1088","affiliations":[{"raw_affiliation_string":"Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China","institution_ids":["https://openalex.org/I1327237609"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041550104","display_name":"Ruyi Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruyi Lu","raw_affiliation_strings":["Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China"],"raw_orcid":"https://orcid.org/0009-0001-8771-7498","affiliations":[{"raw_affiliation_string":"Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China","institution_ids":["https://openalex.org/I1327237609"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hengrui Zhang","orcid":"https://orcid.org/0009-0004-3827-8363"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hengrui Zhang","raw_affiliation_strings":["Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China"],"raw_orcid":"https://orcid.org/0009-0004-3827-8363","affiliations":[{"raw_affiliation_string":"Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China","institution_ids":["https://openalex.org/I1327237609"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091364297","display_name":"Yuhu Cheng","orcid":"https://orcid.org/0000-0003-2022-9999"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhu Cheng","raw_affiliation_strings":["Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-2022-9999","affiliations":[{"raw_affiliation_string":"Engineering Research Center of Intelligent Control for Underground Space, Ministry of Education, Xuzhou, China","institution_ids":["https://openalex.org/I1327237609"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5108064895"],"corresponding_institution_ids":["https://openalex.org/I1327237609"],"apc_list":null,"apc_paid":null,"fwci":5.4855,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.92049596,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"17","issue":"4","first_page":"1011","last_page":"1021"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13731","display_name":"Advanced Computing and Algorithms","score":0.8586999773979187,"subfield":{"id":"https://openalex.org/subfields/3322","display_name":"Urban Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13731","display_name":"Advanced Computing and Algorithms","score":0.8586999773979187,"subfield":{"id":"https://openalex.org/subfields/3322","display_name":"Urban Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.8166000247001648,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.8065999746322632,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.860995352268219},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7578022480010986},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.45170462131500244},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41880252957344055}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.860995352268219},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7578022480010986},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.45170462131500244},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41880252957344055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcds.2025.3540115","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcds.2025.3540115","pdf_url":null,"source":{"id":"https://openalex.org/S2488537894","display_name":"IEEE Transactions on Cognitive and Developmental Systems","issn_l":"2379-8920","issn":["2379-8920","2379-8939"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive and Developmental Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4756161396","display_name":null,"funder_award_id":"62176259","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4823360002","display_name":null,"funder_award_id":"62373364","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W3035524453","https://openalex.org/W3093210455","https://openalex.org/W3110979110","https://openalex.org/W3175558129","https://openalex.org/W3205321526","https://openalex.org/W3211437739","https://openalex.org/W4220733308","https://openalex.org/W4252279978","https://openalex.org/W4286896674","https://openalex.org/W4312335991","https://openalex.org/W4323644076","https://openalex.org/W4368232633","https://openalex.org/W4380763481","https://openalex.org/W4386562162","https://openalex.org/W4388286372","https://openalex.org/W4389104669","https://openalex.org/W4392745198","https://openalex.org/W4392902630","https://openalex.org/W4393405305","https://openalex.org/W4395069565","https://openalex.org/W4409057813","https://openalex.org/W6747387971","https://openalex.org/W6747473740","https://openalex.org/W6756256016","https://openalex.org/W6768843968","https://openalex.org/W6771570156","https://openalex.org/W6776867236","https://openalex.org/W6776901495","https://openalex.org/W6787959036","https://openalex.org/W6796848067","https://openalex.org/W6803519892","https://openalex.org/W6809850638","https://openalex.org/W6810343060","https://openalex.org/W6839256673","https://openalex.org/W6843334904"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2138720691","https://openalex.org/W2376932109"],"abstract_inverted_index":{"Although":[0],"recent":[1],"research":[2],"has":[3],"made":[4],"some":[5],"progress":[6],"in":[7,23,37,51,116,157],"deep":[8],"reinforcement":[9,64,78,121],"learning":[10,40,54,65,79,90,119,122,144],"based":[11,67],"on":[12,31,68,89,153],"raw":[13],"pixels,":[14],"the":[15,38,52,84,117,126,142,158],"low":[16],"sample":[17,174],"efficiency":[18],"remains":[19],"a":[20,59],"key":[21],"challenge":[22],"this":[24],"field.":[25],"Existing":[26],"solutions":[27],"often":[28],"focus":[29,88],"solely":[30],"extracting":[32],"more":[33],"effective":[34,146],"state":[35,49,93,130],"representations":[36,50,147],"representation":[39,118],"stage":[41],"and":[42,61,91,105,120,129,148,171],"overlook":[43],"how":[44],"to":[45,86,124,140],"better":[46],"utilize":[47],"these":[48],"policy":[53],"stage.":[55],"To":[56],"address":[57],"this,":[58],"simple":[60],"sample-efficient":[62],"visual":[63],"method":[66,82],"multiview":[69],"optimization":[70,112],"aggregation":[71,113],"(MVOA-VRL)":[72],"is":[73],"proposed":[74],"for":[75],"pixel-based":[76],"off-policy":[77],"frameworks.":[80],"This":[81],"enables":[83],"agent":[85],"concurrently":[87],"utilizing":[92],"representations.":[94],"Specifically,":[95],"MVOA-VRL":[96,138,167],"acquires":[97],"multiple":[98,133],"views":[99],"of":[100,132,145],"samples":[101,134],"through":[102],"random":[103],"crop":[104],"adaptive":[106],"intensity":[107],"adjustment.":[108],"It":[109],"then":[110],"introduces":[111],"methods":[114],"separately":[115],"modules":[123],"aggregate":[125],"similarities,":[127],"actions,":[128],"values":[131],"from":[135],"different":[136],"views.":[137],"aims":[139],"promote":[141],"agent's":[143],"stable":[149],"policies.":[150],"Experimental":[151],"results":[152],"continuous":[154],"control":[155],"tasks":[156],"DMControl":[159],"environment":[160],"show":[161],"that,":[162],"compared":[163],"with":[164],"state-of-the-art":[165],"methods,":[166],"achieves":[168],"higher":[169],"scores":[170],"significantly":[172],"improves":[173],"efficiency.":[175]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
