{"id":"https://openalex.org/W4402351070","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650970","title":"Autoencoder Reconstruction Model for Long-Horizon Exploration","display_name":"Autoencoder Reconstruction Model for Long-Horizon Exploration","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402351070","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650970"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10650970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn60899.2024.10650970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089763177","display_name":"Renye Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Renye Yan","raw_affiliation_strings":["Peiking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peiking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027187253","display_name":"Youting Wu","orcid":"https://orcid.org/0000-0003-4449-1561"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"You Wu","raw_affiliation_strings":["Nanjing University,Software Institute,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"Nanjing University,Software Institute,Nanjing,China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016091831","display_name":"Yaozhong Gan","orcid":null},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaozhong Gan","raw_affiliation_strings":["Nanjing University of Aeronautics and Astronautics,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Aeronautics and Astronautics,Nanjing,China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100869147","display_name":"Yunfan Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunfan Yang","raw_affiliation_strings":["Peiking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peiking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109778648","display_name":"Zhaoke Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhaoke Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045078054","display_name":"Zongxi Liu","orcid":"https://orcid.org/0000-0003-0018-9037"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zongxi Liu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100327574","display_name":"Xin Zhang","orcid":"https://orcid.org/0000-0003-1583-6401"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xin Zhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100526661","display_name":"Ling Liang","orcid":"https://orcid.org/0009-0009-0809-9053"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ling Liang","raw_affiliation_strings":["Peiking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peiking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060554231","display_name":"Yimao Cai","orcid":"https://orcid.org/0000-0002-6854-8211"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yimao Cai","raw_affiliation_strings":["Peiking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peiking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5089763177"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1814781,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11801","display_name":"Reservoir Engineering and Simulation Methods","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11801","display_name":"Reservoir Engineering and Simulation Methods","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9735999703407288,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14470","display_name":"Advanced Data Processing Techniques","score":0.963100016117096,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.844305157661438},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6108824610710144},{"id":"https://openalex.org/keywords/horizon","display_name":"Horizon","score":0.6093023419380188},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4321492910385132},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.18843290209770203},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10909587144851685}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.844305157661438},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6108824610710144},{"id":"https://openalex.org/C159176650","wikidata":"https://www.wikidata.org/wiki/Q43261","display_name":"Horizon","level":2,"score":0.6093023419380188},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4321492910385132},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.18843290209770203},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10909587144851685},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10650970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn60899.2024.10650970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","score":0.41999998688697815,"display_name":"Climate action"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1771410628","https://openalex.org/W1931877416","https://openalex.org/W1986014385","https://openalex.org/W1988526405","https://openalex.org/W2000514530","https://openalex.org/W2034806191","https://openalex.org/W2109910161","https://openalex.org/W2112447569","https://openalex.org/W2121863487","https://openalex.org/W2135046866","https://openalex.org/W2144558232","https://openalex.org/W2145339207","https://openalex.org/W2156737235","https://openalex.org/W2167489871","https://openalex.org/W2188721763","https://openalex.org/W2417786368","https://openalex.org/W2484231675","https://openalex.org/W2514775068","https://openalex.org/W2596982695","https://openalex.org/W2736601468","https://openalex.org/W2746553466","https://openalex.org/W2788862220","https://openalex.org/W2885550588","https://openalex.org/W2895453875","https://openalex.org/W2962787969","https://openalex.org/W2963099939","https://openalex.org/W2963277051","https://openalex.org/W2963359646","https://openalex.org/W2963523627","https://openalex.org/W2964067469","https://openalex.org/W2982316857","https://openalex.org/W2997289589","https://openalex.org/W3018036994","https://openalex.org/W3034962946","https://openalex.org/W3129322645","https://openalex.org/W3175870124","https://openalex.org/W4287867830","https://openalex.org/W4298857966","https://openalex.org/W6637967152","https://openalex.org/W6638088447","https://openalex.org/W6676727762","https://openalex.org/W6683195989","https://openalex.org/W6716474083","https://openalex.org/W6718092244","https://openalex.org/W6741002519","https://openalex.org/W6751540476","https://openalex.org/W6753925943","https://openalex.org/W6754957883","https://openalex.org/W6756303580","https://openalex.org/W6758641611","https://openalex.org/W6771807793","https://openalex.org/W6922480057"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W3013693939","https://openalex.org/W2159052453","https://openalex.org/W2566616303","https://openalex.org/W3131327266","https://openalex.org/W2734887215","https://openalex.org/W4297051394","https://openalex.org/W2752972570","https://openalex.org/W4220775285"],"abstract_inverted_index":{"Conventional":[0],"reinforcement":[1,124],"learning":[2],"(RL)":[3],"algorithms":[4],"often":[5],"necessitate":[6],"millions":[7],"of":[8,123],"environment":[9],"interactions":[10,49],"to":[11,64,77,96,135],"ascertain":[12],"an":[13,56,93],"efficacious":[14],"policy.":[15],"In":[16],"stark":[17],"contrast,":[18],"humans,":[19],"leveraging":[20],"their":[21],"curiosity":[22],"mechanisms,":[23],"can":[24],"develop":[25],"proficient":[26],"policies":[27],"with":[28,87,113],"minimal":[29],"effort.":[30],"Drawing":[31],"inspiration":[32],"from":[33,68],"this":[34,140],"observation,":[35],"we":[36],"introduce":[37],"the":[38,69,98,105,110,114,121,129],"Autoencoder":[39],"Reconstruction":[40],"Model(ARM),":[41],"a":[42,60],"curiosity-driven":[43],"RL":[44,79],"model":[45],"that":[46,104],"significantly":[47],"reduces":[48],"while":[50],"enhancing":[51],"policy":[52],"effectiveness.":[53],"ARM":[54,71,90,111],"employs":[55],"autoencoder":[57],"module,":[58],"utilizing":[59],"deep":[61],"neural":[62],"network":[63],"learn":[65],"feature":[66],"representations":[67],"environment.":[70],"utilizes":[72],"its":[73],"Curiosity":[74],"Measurement":[75],"Module":[76],"motivate":[78],"agents":[80],"for":[81],"effective":[82],"exploration,":[83],"particularly":[84],"in":[85,139],"environments":[86],"sparse":[88],"rewards.":[89],"also":[91],"introduces":[92],"innovative":[94],"mechanism":[95],"balance":[97],"exploration-exploitation":[99],"dilemma.":[100],"Theoretical":[101],"analyses":[102],"reveal":[103],"reward":[106,116],"shaping":[107,117],"introduced":[108],"by":[109],"aligns":[112],"potential-based":[115],"paradigm,":[118],"thereby":[119],"preserving":[120],"optimality":[122],"learning.":[125],"We":[126],"will":[127],"release":[128],"source":[130],"code":[131],"and":[132],"trained":[133],"models":[134],"facilitate":[136],"further":[137],"studies":[138],"research":[141],"direction.":[142]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
