{"id":"https://openalex.org/W2109294593","doi":"https://doi.org/10.1109/icsmc.2004.1401110","title":"A modular neurocontroller for creative mobile autonomous robots learning by temporal difference","display_name":"A modular neurocontroller for creative mobile autonomous robots learning by temporal difference","publication_year":2005,"publication_date":"2005-03-31","ids":{"openalex":"https://openalex.org/W2109294593","doi":"https://doi.org/10.1109/icsmc.2004.1401110","mag":"2109294593"},"language":"en","primary_location":{"id":"doi:10.1109/icsmc.2004.1401110","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsmc.2004.1401110","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2004 IEEE International Conference on Systems, Man and Cybernetics (IEEE Cat. No.04CH37583)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000576234","display_name":"Helmut A. Mayer","orcid":"https://orcid.org/0000-0002-2428-0962"},"institutions":[{"id":"https://openalex.org/I182212641","display_name":"University of Salzburg","ror":"https://ror.org/05gs8cd61","country_code":"AT","type":"education","lineage":["https://openalex.org/I182212641"]}],"countries":["AT"],"is_corresponding":true,"raw_author_name":"H.A. Mayer","raw_affiliation_strings":["Department of Scientific Computing, University of Salzburg, Salzburg, Austria","Dept. of Sci. Comput., Salzburg Univ., Austria"],"affiliations":[{"raw_affiliation_string":"Department of Scientific Computing, University of Salzburg, Salzburg, Austria","institution_ids":["https://openalex.org/I182212641"]},{"raw_affiliation_string":"Dept. of Sci. Comput., Salzburg Univ., Austria","institution_ids":["https://openalex.org/I182212641"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5000576234"],"corresponding_institution_ids":["https://openalex.org/I182212641"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13159906,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"6","issue":null,"first_page":"5742","last_page":"5747"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10581","display_name":"Neural dynamics and brain function","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.80748051404953},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.7239552736282349},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7209962010383606},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7024911642074585},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6194732785224915},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5730361938476562},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.561485767364502},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.4950787127017975},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.47929754853248596},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.47523191571235657},{"id":"https://openalex.org/keywords/evolutionary-robotics","display_name":"Evolutionary robotics","score":0.42768171429634094},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4149662256240845},{"id":"https://openalex.org/keywords/social-robot","display_name":"Social robot","score":0.41225191950798035},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.41143739223480225},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08998522162437439}],"concepts":[{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.80748051404953},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.7239552736282349},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7209962010383606},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7024911642074585},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6194732785224915},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5730361938476562},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.561485767364502},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.4950787127017975},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.47929754853248596},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.47523191571235657},{"id":"https://openalex.org/C199505168","wikidata":"https://www.wikidata.org/wiki/Q3267529","display_name":"Evolutionary robotics","level":3,"score":0.42768171429634094},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4149662256240845},{"id":"https://openalex.org/C162947575","wikidata":"https://www.wikidata.org/wiki/Q2005645","display_name":"Social robot","level":5,"score":0.41225191950798035},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.41143739223480225},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08998522162437439},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icsmc.2004.1401110","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsmc.2004.1401110","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2004 IEEE International Conference on Systems, Man and Cybernetics (IEEE Cat. No.04CH37583)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6399999856948853,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W1488698606","https://openalex.org/W1608391772","https://openalex.org/W1936699754","https://openalex.org/W2076103977","https://openalex.org/W2103285838","https://openalex.org/W2121796542","https://openalex.org/W2312609093","https://openalex.org/W4214717370","https://openalex.org/W6640552426","https://openalex.org/W6677897226"],"related_works":["https://openalex.org/W13141533","https://openalex.org/W2314472328","https://openalex.org/W2544716473","https://openalex.org/W2909564046","https://openalex.org/W3044674998","https://openalex.org/W2126211886","https://openalex.org/W2134294860","https://openalex.org/W2493438666","https://openalex.org/W1965774354","https://openalex.org/W2724299411"],"abstract_inverted_index":{"One":[0],"of":[1,10,42,83,99,129,134,174,182],"the":[2,8,27,53,78,91,110,123,135,154,158,160,172,175,180],"most":[3],"prominent":[4],"research":[5],"goals":[6],"in":[7,106,153],"field":[9],"mobile":[11],"autonomous":[12],"robots":[13,17,28,184],"is":[14,76,86],"to":[15,21,23,32,51,73,94,108,122,162,185],"create":[16],"that":[18,77],"are":[19,59,142],"able":[20,31],"adapt":[22],"new":[24,164],"environments,":[25],"i.e.,":[26],"should":[29],"be":[30],"learn":[33,186],"during":[34],"their":[35],"\"lifetime\"":[36],"possibly":[37],"without":[38],"(or":[39],"a":[40,60,84,118,127],"minimum)":[41],"human":[43],"intervention.":[44],"When":[45],"employing":[46],"artificial":[47],"neural":[48],"networks":[49],"(ANNs)":[50],"control":[52],"robot,":[54],"reinforcement":[55],"learning":[56,75],"(RL)":[57],"techniques":[58],"good":[61],"candidate":[62],"for":[63],"achieving":[64],"continuous":[65],"on-line":[66],"learning.":[67,193],"A":[68],"problem":[69,115],"with":[70],"RL":[71],"applied":[72],"robot":[74,85,92,159],"state":[79],"(and":[80],"action)":[81],"space":[82],"typically":[87],"not":[88],"discrete.":[89],"Thus,":[90],"had":[93],"evaluate":[95,163],"an":[96],"infinite":[97],"number":[98],"possible":[100],"actions":[101],"at":[102],"every":[103],"time":[104],"step":[105],"order":[107],"select":[109],"best.":[111],"To":[112],"overcome":[113],"this":[114],"we":[116],"add":[117],"second":[119],"network":[120,156],"module":[121],"neurocontroller":[124],"acting":[125],"as":[126],"memory":[128,155],"previous":[130,145],"decisions":[131,146],"(state-action":[132],"pairs)":[133],"robot.":[136],"The":[137],"robot's":[138],"actual":[139],"decisions,":[140],"then,":[141],"based":[143],"on":[144],"retrieved":[147],"from":[148],"memory.":[149],"Additionally,":[150],"intrinsic":[151],"noise":[152],"gives":[157],"possibility":[161],"\"ideas\",":[165],"hence":[166],"it":[167],"becomes":[168],"creative.":[169],"We":[170],"analyze":[171],"potential":[173],"above":[176],"approach":[177],"by":[178],"measuring":[179],"ability":[181],"(simulated)":[183],"simple":[187],"tasks":[188],"using":[189],"temporal":[190],"difference":[191],"(TD)":[192]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
