{"id":"https://openalex.org/W4401018075","doi":"https://doi.org/10.1109/ur61395.2024.10597441","title":"Relational Q-Functionals: Multi-Agent Learning to Recover from Unforeseen Robot Malfunctions in Continuous Action Domains","display_name":"Relational Q-Functionals: Multi-Agent Learning to Recover from Unforeseen Robot Malfunctions in Continuous Action Domains","publication_year":2024,"publication_date":"2024-06-24","ids":{"openalex":"https://openalex.org/W4401018075","doi":"https://doi.org/10.1109/ur61395.2024.10597441"},"language":"en","primary_location":{"id":"doi:10.1109/ur61395.2024.10597441","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ur61395.2024.10597441","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 21st International Conference on Ubiquitous Robots (UR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022223707","display_name":"Yasin F\u0131nd\u0131k","orcid":null},"institutions":[{"id":"https://openalex.org/I133738476","display_name":"University of Massachusetts Lowell","ror":"https://ror.org/03hamhx47","country_code":"US","type":"education","lineage":["https://openalex.org/I133738476"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yasin Findik","raw_affiliation_strings":["Richard Miner School of Computer and Information Sciences, University of Massachusetts,PeARL Lab,Lowell,MA,USA"],"affiliations":[{"raw_affiliation_string":"Richard Miner School of Computer and Information Sciences, University of Massachusetts,PeARL Lab,Lowell,MA,USA","institution_ids":["https://openalex.org/I133738476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031412747","display_name":"Paul Robinette","orcid":"https://orcid.org/0000-0001-8066-156X"},"institutions":[{"id":"https://openalex.org/I133738476","display_name":"University of Massachusetts Lowell","ror":"https://ror.org/03hamhx47","country_code":"US","type":"education","lineage":["https://openalex.org/I133738476"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paul Robinette","raw_affiliation_strings":["University of Massachusetts,Department of Electrical and Computer Engineering,Lowell,MA,USA"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts,Department of Electrical and Computer Engineering,Lowell,MA,USA","institution_ids":["https://openalex.org/I133738476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084813481","display_name":"Kshitij Jerath","orcid":"https://orcid.org/0000-0001-6356-9438"},"institutions":[{"id":"https://openalex.org/I133738476","display_name":"University of Massachusetts Lowell","ror":"https://ror.org/03hamhx47","country_code":"US","type":"education","lineage":["https://openalex.org/I133738476"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kshitij Jerath","raw_affiliation_strings":["University of Massachusetts,Department of Mechanical Engineering,Lowell,MA,USA"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts,Department of Mechanical Engineering,Lowell,MA,USA","institution_ids":["https://openalex.org/I133738476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5096831411","display_name":"Reza Azadeh","orcid":"https://orcid.org/0000-0002-6651-8684"},"institutions":[{"id":"https://openalex.org/I133738476","display_name":"University of Massachusetts Lowell","ror":"https://ror.org/03hamhx47","country_code":"US","type":"education","lineage":["https://openalex.org/I133738476"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Reza Azadeh","raw_affiliation_strings":["Richard Miner School of Computer and Information Sciences, University of Massachusetts,PeARL Lab,Lowell,MA,USA"],"affiliations":[{"raw_affiliation_string":"Richard Miner School of Computer and Information Sciences, University of Massachusetts,PeARL Lab,Lowell,MA,USA","institution_ids":["https://openalex.org/I133738476"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5022223707"],"corresponding_institution_ids":["https://openalex.org/I133738476"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.157591,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"20","issue":null,"first_page":"251","last_page":"256"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10763","display_name":"Digital Transformation in Industry","score":0.8274999856948853,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10763","display_name":"Digital Transformation in Industry","score":0.8274999856948853,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.6756809949874878},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6412994861602783},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6305826902389526},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4939637780189514},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4695979356765747},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.4127488136291504},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.1819092035293579},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0844980776309967}],"concepts":[{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.6756809949874878},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6412994861602783},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6305826902389526},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4939637780189514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4695979356765747},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.4127488136291504},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.1819092035293579},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0844980776309967},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ur61395.2024.10597441","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ur61395.2024.10597441","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 21st International Conference on Ubiquitous Robots (UR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.550000011920929,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G1257104999","display_name":null,"funder_award_id":"W911NF20-2-0089","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G3611504697","display_name":null,"funder_award_id":"IIS-2112633","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1641379095","https://openalex.org/W2096145798","https://openalex.org/W2099618002","https://openalex.org/W2104602264","https://openalex.org/W2145339207","https://openalex.org/W2155007355","https://openalex.org/W2156194062","https://openalex.org/W2166533447","https://openalex.org/W2626637010","https://openalex.org/W2740377041","https://openalex.org/W2799899844","https://openalex.org/W2883532348","https://openalex.org/W2941168284","https://openalex.org/W2963658727","https://openalex.org/W2963762747","https://openalex.org/W2963864421","https://openalex.org/W3163926178","https://openalex.org/W3209101326","https://openalex.org/W4285579909","https://openalex.org/W4286748781","https://openalex.org/W4295150809","https://openalex.org/W4299802797","https://openalex.org/W4382237550","https://openalex.org/W4391022011","https://openalex.org/W4391800915","https://openalex.org/W6675811377","https://openalex.org/W6682849425","https://openalex.org/W6684921986","https://openalex.org/W6738796088","https://openalex.org/W6739516088","https://openalex.org/W6742529797","https://openalex.org/W6744562401","https://openalex.org/W6761989198","https://openalex.org/W6762491519","https://openalex.org/W6766805167","https://openalex.org/W6795908048","https://openalex.org/W6797146277","https://openalex.org/W6840380725","https://openalex.org/W6857726652","https://openalex.org/W6861294192"],"related_works":["https://openalex.org/W2320718078","https://openalex.org/W2653530212","https://openalex.org/W8302103","https://openalex.org/W3171631314","https://openalex.org/W2953216818","https://openalex.org/W2674584172","https://openalex.org/W2967743314","https://openalex.org/W1990892711","https://openalex.org/W2606825221","https://openalex.org/W2030191131"],"abstract_inverted_index":{"Cooperative":[0],"multi-agent":[1,12,140],"learning":[2,102],"methods":[3,17,40],"are":[4],"essential":[5],"in":[6,11,126,139,143],"developing":[7],"effective":[8],"cooperation":[9,119],"strategies":[10],"domains.":[13],"In":[14],"robotics,":[15],"these":[16,114],"extend":[18],"beyond":[19],"multi-robot":[20],"scenarios":[21,144],"to":[22,43,46,61,82,112,117],"single-robot":[23,127],"systems,":[24,141],"where":[25],"they":[26],"enable":[27],"coordination":[28],"among":[29],"different":[30],"robot":[31,34,53],"modules":[32],"(e.g.,":[33],"legs":[35],"or":[36],"joints).":[37],"However,":[38],"current":[39],"often":[41],"struggle":[42],"quickly":[44],"adapt":[45],"unforeseen":[47,146],"failures,":[48],"such":[49],"as":[50],"a":[51,62,76],"malfunctioning":[52],"leg,":[54],"especially":[55],"after":[56],"the":[57,69],"algorithm":[58,90],"has":[59],"converged":[60],"strategy.":[63],"To":[64],"overcome":[65],"this,":[66],"we":[67],"introduce":[68],"Relational":[70],"Q-Functionals":[71],"(RQF)":[72],"framework.":[73],"RQF":[74,109],"leverages":[75],"relational":[77],"network,":[78],"representing":[79],"agents'":[80],"relationships,":[81],"enhance":[83],"adaptability,":[84],"providing":[85],"resilience":[86],"against":[87],"malfunction(s).":[88],"Our":[89,104],"also":[91],"efficiently":[92],"handles":[93],"continuous":[94],"state-action":[95],"domains,":[96],"making":[97],"it":[98],"adept":[99],"for":[100],"robotic":[101],"tasks.":[103],"empirical":[105],"results":[106],"show":[107],"that":[108],"enables":[110],"agents":[111],"use":[113],"relationships":[115],"effectively":[116],"facilitate":[118],"and":[120],"recover":[121],"from":[122],"an":[123],"unexpected":[124],"malfunction":[125],"systems":[128],"with":[129,145],"multiple":[130],"interacting":[131],"modules.":[132],"Thus,":[133],"our":[134],"approach":[135],"offers":[136],"promising":[137],"applications":[138],"particularly":[142],"malfunctions.":[147]},"counts_by_year":[],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
