{"id":"https://openalex.org/W4415398204","doi":"https://doi.org/10.1109/icdl63968.2025.11204455","title":"Intrinsic Reward Decomposition for Soft Robotic Manipulation Tasks","display_name":"Intrinsic Reward Decomposition for Soft Robotic Manipulation Tasks","publication_year":2025,"publication_date":"2025-09-16","ids":{"openalex":"https://openalex.org/W4415398204","doi":"https://doi.org/10.1109/icdl63968.2025.11204455"},"language":null,"primary_location":{"id":"doi:10.1109/icdl63968.2025.11204455","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdl63968.2025.11204455","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Development and Learning (ICDL)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107013437","display_name":"Vladimir Sivtsov","orcid":"https://orcid.org/0009-0007-0098-4766"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":true,"raw_author_name":"Vladimir Sivtsov","raw_affiliation_strings":["University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000"],"affiliations":[{"raw_affiliation_string":"University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120083825","display_name":"Daniil Shkolnik","orcid":null},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Daniil Shkolnik","raw_affiliation_strings":["University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000"],"affiliations":[{"raw_affiliation_string":"University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110845772","display_name":"\u0391\u03bb\u03ad\u03be\u03b1\u03bd\u03b4\u03c1\u03bf\u03c2 \u03a0\u03b1\u03c0\u03b1\u03bd\u03b9\u03ba\u03bf\u03bb\u03ac\u03bf\u03c5","orcid":"https://orcid.org/0009-0002-0098-0013"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Athanasios Papanikolaou","raw_affiliation_strings":["University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000"],"affiliations":[{"raw_affiliation_string":"University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035622961","display_name":"Ivan Markovi\u0107","orcid":"https://orcid.org/0000-0003-4138-1113"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Ivan Markovic","raw_affiliation_strings":["University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000"],"affiliations":[{"raw_affiliation_string":"University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001473761","display_name":"Ivan Petrovi\u0107","orcid":"https://orcid.org/0000-0001-9961-5627"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Ivan Petrovic","raw_affiliation_strings":["University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000"],"affiliations":[{"raw_affiliation_string":"University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000","institution_ids":["https://openalex.org/I181343428"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055298709","display_name":"Enrica Zereik","orcid":"https://orcid.org/0000-0001-6380-3554"},"institutions":[{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"funder","lineage":["https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I4210133906","display_name":"Institute of Marine Engineering","ror":"https://ror.org/02qnx8e75","country_code":"IT","type":"education","lineage":["https://openalex.org/I4210133906","https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Enrica Zereik","raw_affiliation_strings":["Institute of Marine Engineering (CNR-INM),Italian National Research Council,Genoa,Italy,16149"],"affiliations":[{"raw_affiliation_string":"Institute of Marine Engineering (CNR-INM),Italian National Research Council,Genoa,Italy,16149","institution_ids":["https://openalex.org/I4210155236","https://openalex.org/I4210133906"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032713426","display_name":"Fabio Bonsignorio","orcid":"https://orcid.org/0000-0002-5802-2814"},"institutions":[{"id":"https://openalex.org/I181343428","display_name":"University of Zagreb","ror":"https://ror.org/00mv6sv71","country_code":"HR","type":"education","lineage":["https://openalex.org/I181343428"]}],"countries":["HR"],"is_corresponding":false,"raw_author_name":"Fabio Bonsignorio","raw_affiliation_strings":["University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000"],"affiliations":[{"raw_affiliation_string":"University of Zagreb, Faculty of Electrical Engineering and Computing, Unska ulica 3,Zagreb,Croatia,10000","institution_ids":["https://openalex.org/I181343428"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5107013437"],"corresponding_institution_ids":["https://openalex.org/I181343428"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.4061991,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9817000031471252,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9460999965667725,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6879000067710876},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6341999769210815},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.5623000264167786},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5047000050544739},{"id":"https://openalex.org/keywords/soft-robotics","display_name":"Soft robotics","score":0.44830000400543213},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.4375999867916107},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.41690000891685486},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.39469999074935913}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6879000067710876},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6575000286102295},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6341999769210815},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5997999906539917},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.5623000264167786},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5047000050544739},{"id":"https://openalex.org/C2776058767","wikidata":"https://www.wikidata.org/wiki/Q24327151","display_name":"Soft robotics","level":3,"score":0.44830000400543213},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.4375999867916107},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.41690000891685486},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.39469999074935913},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3781999945640564},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3264999985694885},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.3133000135421753},{"id":"https://openalex.org/C2775960376","wikidata":"https://www.wikidata.org/wiki/Q1435859","display_name":"Grippers","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2939000129699707},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.25999999046325684},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.2547000050544739}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icdl63968.2025.11204455","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdl63968.2025.11204455","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Development and Learning (ICDL)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2571445476","https://openalex.org/W2897673281","https://openalex.org/W2910273746","https://openalex.org/W3034637066","https://openalex.org/W4285009743","https://openalex.org/W4367320906","https://openalex.org/W4389667566","https://openalex.org/W4392946708","https://openalex.org/W4413925071"],"related_works":[],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,54],"has":[2],"shown":[3],"remarkable":[4],"potential":[5],"for":[6],"autonomous":[7],"skill":[8],"acquisition.":[9],"However,":[10],"effective":[11,158],"exploration-exploitation":[12],"of":[13,32,110,126,160],"possible":[14],"actions":[15],"and":[16,39,99,136,163],"states":[17],"remains":[18],"a":[19,79,107,123],"fundamental":[20],"challenge,":[21],"especially":[22],"in":[23,87,146],"soft":[24,33,148],"robotic":[25,88,149],"manipulation":[26,137,144,161],"tasks":[27,145],"where":[28,90],"the":[29,58,74,96,100,147],"continuous":[30],"deformation":[31],"materials":[34],"causes":[35],"complex":[36],"nonlinear":[37],"dynamics":[38],"high-dimensional":[40],"state":[41,76],"spaces.":[42],"A":[43],"promising":[44],"solution":[45],"to":[46,56],"this":[47,103,153],"problem":[48],"is":[49],"intrinsic":[50,68,111],"motivation,":[51],"which":[52,82,114],"allows":[53],"agents":[55],"explore":[57],"environment":[59],"more":[60,157],"systematically":[61],"by":[62],"producing":[63],"self-supervised":[64],"reward":[65,69,112],"signals.":[66],"Existing":[67],"techniques,":[70],"however,":[71],"frequently":[72],"approach":[73],"whole":[75],"space":[77],"as":[78],"single":[80],"entity,":[81],"may":[83],"reduce":[84],"their":[85],"efficacy":[86],"manipulation,":[89],"interactions":[91],"can":[92],"take":[93],"place":[94],"between":[95],"manipulated":[97],"item":[98],"robot.":[101],"In":[102],"work,":[104],"we":[105],"introduce":[106],"new":[108],"method":[109,121],"decomposition":[113,155],"focuses":[115],"exploration":[116],"on":[117],"task-relevant":[118],"interactions.":[119],"Our":[120],"implements":[122],"weighted":[124],"combination":[125],"random":[127],"network":[128],"distillation":[129],"rewards":[130],"derived":[131],"separately":[132],"from":[133],"robot":[134],"observations":[135],"object":[138],"states.":[139],"Experimental":[140],"results":[141],"across":[142],"various":[143],"benchmark":[150],"show":[151],"that":[152],"attention-inspired":[154],"enables":[156],"discovery":[159],"strategies":[162],"significantly":[164],"enhances":[165],"performance.":[166]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-22T00:00:00"}
