{"id":"https://openalex.org/W4401751948","doi":"https://doi.org/10.1109/aim55361.2024.10637099","title":"Efficient Design Space Exploration with Multi-Task Reinforcement Learning","display_name":"Efficient Design Space Exploration with Multi-Task Reinforcement Learning","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4401751948","doi":"https://doi.org/10.1109/aim55361.2024.10637099"},"language":"en","primary_location":{"id":"doi:10.1109/aim55361.2024.10637099","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aim55361.2024.10637099","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Advanced Intelligent Mechatronics (AIM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073584703","display_name":"P. Hoffmann","orcid":"https://orcid.org/0000-0002-7924-6219"},"institutions":[{"id":"https://openalex.org/I889804353","display_name":"Robert Bosch (Germany)","ror":"https://ror.org/01fe0jt45","country_code":"DE","type":"company","lineage":["https://openalex.org/I889804353"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Patrick Hoffmann","raw_affiliation_strings":["Robert Bosch GmbH,Corporate Sector Research and Advance Engineering,Renningen,Germany,71272"],"affiliations":[{"raw_affiliation_string":"Robert Bosch GmbH,Corporate Sector Research and Advance Engineering,Renningen,Germany,71272","institution_ids":["https://openalex.org/I889804353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086133983","display_name":"Kirill Gorelik","orcid":"https://orcid.org/0000-0001-6813-6076"},"institutions":[{"id":"https://openalex.org/I889804353","display_name":"Robert Bosch (Germany)","ror":"https://ror.org/01fe0jt45","country_code":"DE","type":"company","lineage":["https://openalex.org/I889804353"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Kirill Gorelik","raw_affiliation_strings":["Robert Bosch GmbH,Corporate Sector Research and Advance Engineering,Renningen,Germany,71272"],"affiliations":[{"raw_affiliation_string":"Robert Bosch GmbH,Corporate Sector Research and Advance Engineering,Renningen,Germany,71272","institution_ids":["https://openalex.org/I889804353"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082684102","display_name":"Valentin Ivanov","orcid":"https://orcid.org/0000-0001-7252-7184"},"institutions":[{"id":"https://openalex.org/I119449181","display_name":"Technische Universit\u00e4t Ilmenau","ror":"https://ror.org/01weqhp73","country_code":"DE","type":"education","lineage":["https://openalex.org/I119449181"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Valentin Ivanov","raw_affiliation_strings":["Technische Universit&#x00E4;t Ilmenau,Department of Computer Science,Ilmenau,Germany,98693"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t Ilmenau,Department of Computer Science,Ilmenau,Germany,98693","institution_ids":["https://openalex.org/I119449181"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5073584703"],"corresponding_institution_ids":["https://openalex.org/I889804353"],"apc_list":null,"apc_paid":null,"fwci":0.3626,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.65757967,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1378","last_page":"1385"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11814","display_name":"Advanced Manufacturing and Logistics Optimization","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7686516046524048},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7139440774917603},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6636930108070374},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5161603689193726},{"id":"https://openalex.org/keywords/space-exploration","display_name":"Space exploration","score":0.4955488443374634},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.47519028186798096},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33386027812957764},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15582668781280518},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.14505469799041748},{"id":"https://openalex.org/keywords/aerospace-engineering","display_name":"Aerospace engineering","score":0.09957191348075867},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.06907385587692261}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7686516046524048},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7139440774917603},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6636930108070374},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5161603689193726},{"id":"https://openalex.org/C104060986","wikidata":"https://www.wikidata.org/wiki/Q180046","display_name":"Space exploration","level":2,"score":0.4955488443374634},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.47519028186798096},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33386027812957764},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15582668781280518},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.14505469799041748},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.09957191348075867},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.06907385587692261}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/aim55361.2024.10637099","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aim55361.2024.10637099","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Advanced Intelligent Mechatronics (AIM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1191599655","https://openalex.org/W2481081394","https://openalex.org/W2624871570","https://openalex.org/W2735995851","https://openalex.org/W2736601468","https://openalex.org/W2913340405","https://openalex.org/W2991309414","https://openalex.org/W2998268493","https://openalex.org/W3013821552","https://openalex.org/W3087549734","https://openalex.org/W3121095832","https://openalex.org/W4230112301","https://openalex.org/W4241431509","https://openalex.org/W4286963241","https://openalex.org/W4287329474","https://openalex.org/W4308754326","https://openalex.org/W4379374853","https://openalex.org/W4390482198","https://openalex.org/W4391338760","https://openalex.org/W6627932998","https://openalex.org/W6677916085","https://openalex.org/W6739365718","https://openalex.org/W6740879895","https://openalex.org/W6741002519","https://openalex.org/W6755851568","https://openalex.org/W6768689258","https://openalex.org/W6770205404","https://openalex.org/W6775647304","https://openalex.org/W6783292247","https://openalex.org/W6790190981","https://openalex.org/W6801964084"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W3196817267","https://openalex.org/W1976600725","https://openalex.org/W4402059566"],"abstract_inverted_index":{"Exploring":[0],"the":[1,13,16,26,55,60,129,186,196],"design":[2,28,64,116,121,138,200],"space":[3,65,139,201],"is":[4,31,67,147,209],"a":[5,37,69,150,181],"critical":[6],"aspect":[7],"of":[8,39,59,81,131,134,190,193,199],"engineering":[9],"and":[10,44,158,167,176,205],"optimization,":[11],"involving":[12],"search":[14],"for":[15,84,97,203],"best":[17],"configuration":[18],"in":[19,63,119,174],"complex":[20],"systems":[21],"with":[22],"numerous":[23],"options.":[24],"In":[25],"system":[27,171,207],"process,":[29],"it":[30],"essential":[32],"to":[33,42,73,149],"take":[34],"into":[35],"account":[36],"range":[38],"constraints":[40],"related":[41],"architecture":[43],"component":[45],"dimensioning,":[46],"as":[47,49,93],"well":[48],"requirements":[50],"defined":[51],"by":[52],"standards":[53],"or":[54],"current":[56],"state-of-the-art.":[57],"One":[58],"main":[61],"challenges":[62],"exploration":[66,140,202],"developing":[68],"control":[70,99,135,194],"strategy":[71],"tailored":[72],"each":[74],"specific":[75],"design,":[76],"facilitating":[77],"an":[78,94],"objective":[79],"comparison":[80],"different":[82,164],"designs":[83],"closed-loop":[85],"scenarios.":[86],"Even":[87],"though":[88],"reinforcement":[89,143],"learning":[90],"offers":[91],"promise":[92],"automated":[95,132,191],"solution":[96],"deriving":[98],"strategies,":[100],"its":[101],"trial-and-error":[102],"methodology":[103],"demands":[104],"significant":[105],"computational":[106],"resources.":[107],"To":[108],"address":[109],"this":[110],"challenge,":[111],"leveraging":[112],"knowledge":[113],"from":[114],"similar":[115],"combinations,":[117],"especially":[118],"larger":[120],"spaces,":[122],"becomes":[123],"beneficial.":[124],"This":[125],"study":[126],"specifically":[127],"targets":[128],"speed-up":[130],"derivation":[133,192],"strategies":[136,195],"within":[137,180],"using":[141],"multi-task":[142],"learning.":[144],"The":[145],"work":[146],"applied":[148],"safety-critical":[151],"cross-domain":[152],"motion":[153],"system,":[154],"comprising":[155],"drive,":[156],"brake,":[157],"steer":[159],"systems.":[160],"It":[161],"further":[162],"considers":[163],"driving":[165],"scenarios":[166],"failure":[168,178],"cases,":[169],"enabling":[170],"performance":[172],"assessment":[173],"normal":[175],"various":[177],"modes":[179],"limited":[182],"time":[183],"frame.":[184],"With":[185],"proposed":[187],"speed":[188],"up":[189],"overall":[197],"effectiveness":[198],"multi-actuated":[204],"integrated":[206],"architectures":[208],"enhanced.":[210]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
