{"id":"https://openalex.org/W4280625771","doi":"https://doi.org/10.1109/icra46639.2022.9811781","title":"Gaussian Process Self-triggered Policy Search in Weakly Observable Environments","display_name":"Gaussian Process Self-triggered Policy Search in Weakly Observable Environments","publication_year":2022,"publication_date":"2022-05-23","ids":{"openalex":"https://openalex.org/W4280625771","doi":"https://doi.org/10.1109/icra46639.2022.9811781"},"language":"en","primary_location":{"id":"doi:10.1109/icra46639.2022.9811781","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9811781","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007321577","display_name":"Hikaru Sasaki","orcid":"https://orcid.org/0000-0001-7380-1931"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hikaru Sasaki","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST),Division of Information Science,Japan","Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST), Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST),Division of Information Science,Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST), Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019757077","display_name":"Terushi Hirabayashi","orcid":"https://orcid.org/0000-0003-1040-3455"},"institutions":[{"id":"https://openalex.org/I38674515","display_name":"Kanadevia (Japan)","ror":"https://ror.org/05fvfp460","country_code":"JP","type":"company","lineage":["https://openalex.org/I38674515"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Terushi Hirabayashi","raw_affiliation_strings":["Hitachi Zosen Corporation,Japan","Hitachi Zosen Corporation, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hitachi Zosen Corporation,Japan","institution_ids":["https://openalex.org/I38674515"]},{"raw_affiliation_string":"Hitachi Zosen Corporation, Japan","institution_ids":["https://openalex.org/I38674515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068838254","display_name":"Kaoru Kawabata","orcid":"https://orcid.org/0000-0001-6281-7276"},"institutions":[{"id":"https://openalex.org/I38674515","display_name":"Kanadevia (Japan)","ror":"https://ror.org/05fvfp460","country_code":"JP","type":"company","lineage":["https://openalex.org/I38674515"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kaoru Kawabata","raw_affiliation_strings":["Hitachi Zosen Corporation,Japan","Hitachi Zosen Corporation, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hitachi Zosen Corporation,Japan","institution_ids":["https://openalex.org/I38674515"]},{"raw_affiliation_string":"Hitachi Zosen Corporation, Japan","institution_ids":["https://openalex.org/I38674515"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042074952","display_name":"Takamitsu Matsubara","orcid":"https://orcid.org/0000-0003-3545-4814"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takamitsu Matsubara","raw_affiliation_strings":["Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST),Division of Information Science,Japan","Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST), Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST),Division of Information Science,Japan","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"Division of Information Science, Graduate School of Science and Technology, Nara Institute of Science and Technology (NAIST), Japan","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2076,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.3864829,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"5946","last_page":"5952"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11236","display_name":"Control Systems and Identification","score":0.9782000184059143,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6794354915618896},{"id":"https://openalex.org/keywords/garbage","display_name":"Garbage","score":0.5863054394721985},{"id":"https://openalex.org/keywords/gaussian-process","display_name":"Gaussian process","score":0.5434591174125671},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4903426170349121},{"id":"https://openalex.org/keywords/duration","display_name":"Duration (music)","score":0.48437580466270447},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.47461286187171936},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.43546727299690247},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.429085910320282},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41641560196876526},{"id":"https://openalex.org/keywords/incineration","display_name":"Incineration","score":0.41047194600105286},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3543410003185272},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.3510046601295471},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18598687648773193},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12971842288970947},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.11134976148605347}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6794354915618896},{"id":"https://openalex.org/C75403996","wikidata":"https://www.wikidata.org/wiki/Q5521979","display_name":"Garbage","level":2,"score":0.5863054394721985},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.5434591174125671},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4903426170349121},{"id":"https://openalex.org/C112758219","wikidata":"https://www.wikidata.org/wiki/Q16038819","display_name":"Duration (music)","level":2,"score":0.48437580466270447},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.47461286187171936},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.43546727299690247},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.429085910320282},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41641560196876526},{"id":"https://openalex.org/C130751788","wikidata":"https://www.wikidata.org/wiki/Q622772","display_name":"Incineration","level":2,"score":0.41047194600105286},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3543410003185272},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.3510046601295471},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18598687648773193},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12971842288970947},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.11134976148605347},{"id":"https://openalex.org/C548081761","wikidata":"https://www.wikidata.org/wiki/Q180388","display_name":"Waste management","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra46639.2022.9811781","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9811781","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W137285897","https://openalex.org/W1985235885","https://openalex.org/W2018705428","https://openalex.org/W2055921164","https://openalex.org/W2070801665","https://openalex.org/W2109910161","https://openalex.org/W2498991332","https://openalex.org/W2599381599","https://openalex.org/W2611756877","https://openalex.org/W2611833022","https://openalex.org/W2751302235","https://openalex.org/W2899105324","https://openalex.org/W2908518653","https://openalex.org/W2997896361","https://openalex.org/W3012370795","https://openalex.org/W3014507210","https://openalex.org/W3035992145","https://openalex.org/W3168354865","https://openalex.org/W3173031723","https://openalex.org/W3185855727","https://openalex.org/W4211049957","https://openalex.org/W4297791702","https://openalex.org/W6605566567","https://openalex.org/W6629804754","https://openalex.org/W6646535569","https://openalex.org/W6729403857","https://openalex.org/W6781678525"],"related_works":["https://openalex.org/W2612848883","https://openalex.org/W2032904806","https://openalex.org/W3088744871","https://openalex.org/W1221512877","https://openalex.org/W4382053766","https://openalex.org/W2348837382","https://openalex.org/W3035541749","https://openalex.org/W641660632","https://openalex.org/W2392175750","https://openalex.org/W2030133330"],"abstract_inverted_index":{"The":[0],"environments":[1,59],"of":[2,44,93,163],"such":[3,58],"large":[4],"industrial":[5],"machines":[6],"as":[7,136],"waste":[8,11,175,186],"cranes":[9],"in":[10,27,57],"incineration":[12],"plants":[13],"are":[14],"often":[15],"weakly":[16],"observable,":[17],"where":[18],"little":[19],"information":[20],"about":[21],"the":[22,28,42,45,52,104,108,112,116,121,130,157,161,192,200,206],"environ-mental":[23],"state":[24,43],"is":[25,134],"contained":[26],"observations":[29,128,179],"due":[30],"to":[31,47,129,155,198],"technical":[32],"difficulty":[33],"or":[34,119],"maintenance":[35],"cost":[36],"(e.g.,":[37,64],"no":[38],"sensors":[39],"for":[40,111,173],"observing":[41],"garbage":[46],"be":[48],"handled).":[49],"Based":[50],"on":[51,72,148,170,205],"findings":[53],"that":[54],"skilled":[55],"operators":[56],"choose":[60],"predetermined":[61],"control":[62,94],"strategies":[63],"grasping":[65],"and":[66,68,97,123,145,152,183,202],"scattering)":[67],"their":[69],"durations":[70],"based":[71,147,204],"sensor":[73],"values,":[74],"we":[75,167],"propose":[76],"a":[77,174,181,184],"novel":[78],"non-parametric":[79],"policy":[80,86,110,118],"search":[81,87],"algorithm:":[82],"Gaussian":[83],"process":[84],"self-triggered":[85],"(GPSTPS).":[88],"GPSTPS":[89,138],"has":[90],"two":[91],"types":[92],"policies:":[95],"action":[96,105,109,122,201],"duration.":[98],"A":[99],"gating":[100],"mechanism":[101],"either":[102],"maintains":[103],"selected":[106],"by":[107,115,125,143],"duration":[113,117,124,203],"specified":[114],"updates":[120],"passing":[126],"new":[127],"policy;":[131],"therefore,":[132],"it":[133],"categorized":[135],"self-triggered.":[137],"simultaneously":[139],"learns":[140],"both":[141],"policies":[142,197],"trial":[144],"error":[146],"sparse":[149],"GP":[150],"priors":[151],"variational":[153],"learning":[154],"maximize":[156],"return.":[158],"To":[159],"verify":[160],"performance":[162],"our":[164],"proposed":[165,193],"method,":[166],"conducted":[168],"experiments":[169],"garbage-grasping-scattering":[171],"task":[172],"crane":[176,187],"with":[177],"weak":[178],"using":[180],"simulation":[182],"robotic":[185],"system.":[188],"As":[189],"experimental":[190],"results,":[191],"method":[194],"acquired":[195],"suitable":[196],"determine":[199],"garbage's":[207],"characteristics.":[208]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
