{"id":"https://openalex.org/W4375928942","doi":"https://doi.org/10.1109/tim.2023.3273687","title":"Learning End-to-End Visual Servoing Using an Improved Soft Actor-Critic Approach With Centralized Novelty Measurement","display_name":"Learning End-to-End Visual Servoing Using an Improved Soft Actor-Critic Approach With Centralized Novelty Measurement","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4375928942","doi":"https://doi.org/10.1109/tim.2023.3273687"},"language":"en","primary_location":{"id":"doi:10.1109/tim.2023.3273687","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tim.2023.3273687","pdf_url":null,"source":{"id":"https://openalex.org/S10892749","display_name":"IEEE Transactions on Instrumentation and Measurement","issn_l":"0018-9456","issn":["0018-9456","1557-9662"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Instrumentation and Measurement","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032200261","display_name":"Jian Gao","orcid":"https://orcid.org/0000-0002-1181-4531"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jian Gao","raw_affiliation_strings":["School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-1181-4531","affiliations":[{"raw_affiliation_string":"School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014270991","display_name":"Yaozhen He","orcid":"https://orcid.org/0000-0002-4671-8371"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaozhen He","raw_affiliation_strings":["School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-4671-8371","affiliations":[{"raw_affiliation_string":"School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100377728","display_name":"Yimin Chen","orcid":"https://orcid.org/0000-0003-1562-1443"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yimin Chen","raw_affiliation_strings":["School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0003-1562-1443","affiliations":[{"raw_affiliation_string":"School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070341037","display_name":"Yufeng Li","orcid":"https://orcid.org/0000-0003-0634-6734"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufeng Li","raw_affiliation_strings":["School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0003-0634-6734","affiliations":[{"raw_affiliation_string":"School of Marine Science and Technology, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5032200261"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":0.7065,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.71211923,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"72","issue":null,"first_page":"1","last_page":"12"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10540","display_name":"Advanced Fluorescence Microscopy Techniques","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.79190593957901},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6964879631996155},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.6641802787780762},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5925084352493286},{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.5595185160636902},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5415464043617249},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5327214002609253},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5177654027938843},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5154955983161926},{"id":"https://openalex.org/keywords/visual-servoing","display_name":"Visual servoing","score":0.4553724527359009},{"id":"https://openalex.org/keywords/novelty-detection","display_name":"Novelty detection","score":0.41986536979675293},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35671842098236084},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.18728870153427124}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.79190593957901},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6964879631996155},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.6641802787780762},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5925084352493286},{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.5595185160636902},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5415464043617249},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5327214002609253},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5177654027938843},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5154955983161926},{"id":"https://openalex.org/C10912380","wikidata":"https://www.wikidata.org/wiki/Q527952","display_name":"Visual servoing","level":3,"score":0.4553724527359009},{"id":"https://openalex.org/C2778924833","wikidata":"https://www.wikidata.org/wiki/Q7064603","display_name":"Novelty detection","level":3,"score":0.41986536979675293},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35671842098236084},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.18728870153427124},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tim.2023.3273687","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tim.2023.3273687","pdf_url":null,"source":{"id":"https://openalex.org/S10892749","display_name":"IEEE Transactions on Instrumentation and Measurement","issn_l":"0018-9456","issn":["0018-9456","1557-9662"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Instrumentation and Measurement","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4363926683","display_name":null,"funder_award_id":"52102469","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5806490193","display_name":null,"funder_award_id":"AB21196029","funder_id":"https://openalex.org/F4320335965","funder_display_name":"Science and Technology Major Project of Guangxi"},{"id":"https://openalex.org/G6812378864","display_name":null,"funder_award_id":"51979228","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335965","display_name":"Science and Technology Major Project of Guangxi","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W779494576","https://openalex.org/W1480053368","https://openalex.org/W2045157402","https://openalex.org/W2082991751","https://openalex.org/W2098774185","https://openalex.org/W2100249329","https://openalex.org/W2201581102","https://openalex.org/W2471783715","https://openalex.org/W2530520848","https://openalex.org/W2736601468","https://openalex.org/W2781726626","https://openalex.org/W2787938642","https://openalex.org/W2788822937","https://openalex.org/W2886946457","https://openalex.org/W2892979040","https://openalex.org/W2910687636","https://openalex.org/W2914261249","https://openalex.org/W2935417428","https://openalex.org/W2942079888","https://openalex.org/W2963276097","https://openalex.org/W2963523627","https://openalex.org/W2964067469","https://openalex.org/W2964270628","https://openalex.org/W3003569344","https://openalex.org/W3010515602","https://openalex.org/W3021493720","https://openalex.org/W3034956653","https://openalex.org/W3041800508","https://openalex.org/W3096775261","https://openalex.org/W3126840281","https://openalex.org/W3129297821","https://openalex.org/W3129721466","https://openalex.org/W3206267548","https://openalex.org/W3216509389","https://openalex.org/W4210592545","https://openalex.org/W4220888007","https://openalex.org/W4287867830","https://openalex.org/W4297775537","https://openalex.org/W6622487243","https://openalex.org/W6628764021","https://openalex.org/W6674884181","https://openalex.org/W6687681856","https://openalex.org/W6717230150","https://openalex.org/W6737664043","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6748839928","https://openalex.org/W6756303580","https://openalex.org/W6758978475","https://openalex.org/W6771807793","https://openalex.org/W6775522024","https://openalex.org/W7037921825"],"related_works":["https://openalex.org/W2064636555","https://openalex.org/W1939982668","https://openalex.org/W2585503716","https://openalex.org/W2076090200","https://openalex.org/W4312933423","https://openalex.org/W3025682415","https://openalex.org/W2081173909","https://openalex.org/W4382317424","https://openalex.org/W1532481220","https://openalex.org/W2604316291"],"abstract_inverted_index":{"End-to-end":[0],"visual":[1],"servoing":[2],"based":[3,61,97,137],"on":[4,62,98,138],"reinforcement":[5],"learning(RL)":[6],"can":[7],"simplify":[8],"the":[9,44,72,75,92,105,113,119,127,139,157,162,182,187,195,198],"design":[10],"of":[11,74,197],"features":[12,64],"and":[13,16,49,107,116,173,178],"control":[14],"laws":[15],"has":[17],"strong":[18],"scalability":[19],"in":[20,35,46,118,126,149],"combination":[21],"with":[22],"neural":[23,68],"networks.":[24],"However,":[25],"it":[26],"is":[27,161],"challenging":[28],"for":[29,153],"RL-based":[30],"VS":[31,135,184],"tasks":[32],"to":[33,43,78,123,193],"operate":[34],"a":[36,57,67,85,99],"continuous":[37],"state":[38,77],"or":[39],"action":[40],"space":[41,47],"due":[42],"difficulty":[45],"exploration":[48],"slow":[50],"training":[51,128],"convergence.":[52],"Hence,":[53],"this":[54],"paper":[55],"presents":[56],"novel":[58],"measurement":[59],"method":[60,89],"centralized":[63],"extracted":[65],"by":[66,103],"network,":[69],"which":[70],"calculates":[71],"novelty":[73,115],"visited":[76],"encourage":[79],"RL-agent":[80],"exploration.":[81],"Moreover,":[82],"we":[83,131,190],"propose":[84],"hybrid":[86],"probability":[87],"sampling":[88],"that":[90,168],"improves":[91],"Prioritized":[93],"Experience":[94],"Replay":[95],"(PER)":[96],"Temporal-Difference":[100],"(TD)":[101],"error":[102],"integrating":[104],"intrinsic":[106],"external":[108],"rewards.":[109],"This":[110],"strategy":[111],"represents":[112],"transition":[114],"quality":[117],"buffer":[120],"replay,":[121],"respectively,":[122],"promote":[124],"convergence":[125],"process.":[129],"Finally,":[130],"develop":[132],"an":[133],"end-to-end":[134,154],"scheme":[136],"maximum":[140],"entropy":[141],"RL":[142],"Soft":[143],"Actor-Critic":[144],"(SAC).":[145],"Several":[146],"simulated":[147],"experiments":[148,192],"CoppeliaSim":[150],"are":[151,176],"designed":[152],"VS,":[155],"where":[156],"target":[158],"detection":[159],"information":[160],"agent\u2019s":[163],"input.":[164],"The":[165],"results":[166],"highlight":[167],"our":[169],"method\u2019s":[170],"reward":[171],"value":[172],"completion":[174],"rates":[175],"0.35":[177],"8.0%":[179],"higher":[180],"than":[181],"SAC":[183],"baseline.":[185],"At":[186],"same":[188],"time,":[189],"conduct":[191],"verify":[194],"effectiveness":[196],"proposed":[199],"algorithm.":[200]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
