{"id":"https://openalex.org/W3087055389","doi":"https://doi.org/10.1007/s00521-021-06850-6","title":"Human engagement providing evaluative and informative advice for interactive reinforcement learning","display_name":"Human engagement providing evaluative and informative advice for interactive reinforcement learning","publication_year":2022,"publication_date":"2022-01-12","ids":{"openalex":"https://openalex.org/W3087055389","doi":"https://doi.org/10.1007/s00521-021-06850-6","mag":"3087055389"},"language":"en","primary_location":{"id":"doi:10.1007/s00521-021-06850-6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-021-06850-6","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-021-06850-6.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00521-021-06850-6.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091862657","display_name":"Adam Bignold","orcid":"https://orcid.org/0000-0001-9002-4281"},"institutions":[{"id":"https://openalex.org/I149672521","display_name":"Federation University","ror":"https://ror.org/05qbzwv83","country_code":"AU","type":"education","lineage":["https://openalex.org/I149672521"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Adam Bignold","raw_affiliation_strings":["School of Engineering, IT and Physical Sciences, Federation University, Ballarat, Australia"],"affiliations":[{"raw_affiliation_string":"School of Engineering, IT and Physical Sciences, Federation University, Ballarat, Australia","institution_ids":["https://openalex.org/I149672521"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044098673","display_name":"Francisco Cruz","orcid":"https://orcid.org/0000-0002-1131-3382"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]},{"id":"https://openalex.org/I4210156023","display_name":"Universidad Central de Chile","ror":"https://ror.org/0577avk88","country_code":"CL","type":"education","lineage":["https://openalex.org/I4210156023"]}],"countries":["AU","CL"],"is_corresponding":false,"raw_author_name":"Francisco Cruz","raw_affiliation_strings":["Escuela de Ingenier\u00eda, Universidad Central de Chile, Santiago, Chile","School of Information Technology, Deakin University, Geelong, Australia"],"affiliations":[{"raw_affiliation_string":"Escuela de Ingenier\u00eda, Universidad Central de Chile, Santiago, Chile","institution_ids":["https://openalex.org/I4210156023"]},{"raw_affiliation_string":"School of Information Technology, Deakin University, Geelong, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032749222","display_name":"Richard Dazeley","orcid":"https://orcid.org/0000-0002-6199-9685"},"institutions":[{"id":"https://openalex.org/I149704539","display_name":"Deakin University","ror":"https://ror.org/02czsnj07","country_code":"AU","type":"education","lineage":["https://openalex.org/I149704539"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Richard Dazeley","raw_affiliation_strings":["School of Information Technology, Deakin University, Geelong, Australia"],"affiliations":[{"raw_affiliation_string":"School of Information Technology, Deakin University, Geelong, Australia","institution_ids":["https://openalex.org/I149704539"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080095540","display_name":"Peter Vamplew","orcid":"https://orcid.org/0000-0002-8687-4424"},"institutions":[{"id":"https://openalex.org/I149672521","display_name":"Federation University","ror":"https://ror.org/05qbzwv83","country_code":"AU","type":"education","lineage":["https://openalex.org/I149672521"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Peter Vamplew","raw_affiliation_strings":["School of Engineering, IT and Physical Sciences, Federation University, Ballarat, Australia"],"affiliations":[{"raw_affiliation_string":"School of Engineering, IT and Physical Sciences, Federation University, Ballarat, Australia","institution_ids":["https://openalex.org/I149672521"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013402425","display_name":"Cameron Foale","orcid":"https://orcid.org/0000-0003-2537-0326"},"institutions":[{"id":"https://openalex.org/I149672521","display_name":"Federation University","ror":"https://ror.org/05qbzwv83","country_code":"AU","type":"education","lineage":["https://openalex.org/I149672521"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Cameron Foale","raw_affiliation_strings":["School of Engineering, IT and Physical Sciences, Federation University, Ballarat, Australia"],"affiliations":[{"raw_affiliation_string":"School of Engineering, IT and Physical Sciences, Federation University, Ballarat, Australia","institution_ids":["https://openalex.org/I149672521"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5091862657"],"corresponding_institution_ids":["https://openalex.org/I149672521"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":2.7774,"has_fulltext":true,"cited_by_count":25,"citation_normalized_percentile":{"value":0.91383036,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"35","issue":"25","first_page":"18215","last_page":"18230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10042","display_name":"Neural and Behavioral Psychology Studies","score":0.9402999877929688,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9366000294685364,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/advice","display_name":"Advice (programming)","score":0.9287353157997131},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6608829498291016},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6304103136062622},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.584551215171814},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4996497631072998},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.4006447196006775},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23499330878257751},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.1767180860042572}],"concepts":[{"id":"https://openalex.org/C2779955035","wikidata":"https://www.wikidata.org/wiki/Q4686785","display_name":"Advice (programming)","level":2,"score":0.9287353157997131},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6608829498291016},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6304103136062622},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.584551215171814},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4996497631072998},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4006447196006775},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23499330878257751},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.1767180860042572},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1007/s00521-021-06850-6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-021-06850-6","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-021-06850-6.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2009.09575","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2009.09575","pdf_url":"https://arxiv.org/pdf/2009.09575","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:vital:18966","is_oa":true,"landing_page_url":"http://researchonline.federation.edu.au/vital/access/HandleResolver/1959.17/197965","pdf_url":null,"source":{"id":"https://openalex.org/S4306400234","display_name":"FedUni ResearchOnline (Federation University Australia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210158496","host_organization_name":"Australian Federation of University Women \u2013 South Australia","host_organization_lineage":["https://openalex.org/I4210158496"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},{"id":"pmh:oai:dro.deakin.edu.au:DU:30162073","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401102","display_name":"Own your potential (DEAKIN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I149704539","host_organization_name":"Deakin University","host_organization_lineage":["https://openalex.org/I149704539"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"},{"id":"pmh:oai:figshare.com:article/20623896","is_oa":true,"landing_page_url":"https://figshare.com/articles/journal_contribution/Human_engagement_providing_evaluative_and_informative_advice_for_interactive_reinforcement_learning/20623896","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1007/s00521-021-06850-6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-021-06850-6","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-021-06850-6.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320315885","display_name":"Australian Government","ror":"https://ror.org/0314h5y94"},{"id":"https://openalex.org/F4320320970","display_name":"Deakin University","ror":"https://ror.org/02czsnj07"},{"id":"https://openalex.org/F4320324008","display_name":"Federation University Australia","ror":"https://ror.org/05qbzwv83"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3087055389.pdf","grobid_xml":"https://content.openalex.org/works/W3087055389.grobid-xml"},"referenced_works_count":84,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W47268242","https://openalex.org/W111328409","https://openalex.org/W196196703","https://openalex.org/W197704362","https://openalex.org/W1501005121","https://openalex.org/W1542941925","https://openalex.org/W1572400973","https://openalex.org/W1580572138","https://openalex.org/W1583837637","https://openalex.org/W1641379095","https://openalex.org/W1777239053","https://openalex.org/W1966259872","https://openalex.org/W1984742304","https://openalex.org/W2031727428","https://openalex.org/W2041367235","https://openalex.org/W2058689487","https://openalex.org/W2070410573","https://openalex.org/W2093313552","https://openalex.org/W2097381042","https://openalex.org/W2098441518","https://openalex.org/W2107726111","https://openalex.org/W2109021302","https://openalex.org/W2116157560","https://openalex.org/W2121110499","https://openalex.org/W2121863487","https://openalex.org/W2131797004","https://openalex.org/W2133040789","https://openalex.org/W2138796020","https://openalex.org/W2154633587","https://openalex.org/W2156578004","https://openalex.org/W2156869222","https://openalex.org/W2157174816","https://openalex.org/W2157726050","https://openalex.org/W2158969944","https://openalex.org/W2165442026","https://openalex.org/W2166798247","https://openalex.org/W2200983898","https://openalex.org/W2400915889","https://openalex.org/W2415726935","https://openalex.org/W2471883051","https://openalex.org/W2539402368","https://openalex.org/W2563829177","https://openalex.org/W2583816737","https://openalex.org/W2620974420","https://openalex.org/W2788455270","https://openalex.org/W2792217087","https://openalex.org/W2795786572","https://openalex.org/W2883750587","https://openalex.org/W2903375875","https://openalex.org/W2911719076","https://openalex.org/W2912947802","https://openalex.org/W2919115771","https://openalex.org/W2944766483","https://openalex.org/W2946780324","https://openalex.org/W2957624498","https://openalex.org/W2975684468","https://openalex.org/W3012983342","https://openalex.org/W3015592223","https://openalex.org/W3036003300","https://openalex.org/W3038676770","https://openalex.org/W3039116038","https://openalex.org/W3039772337","https://openalex.org/W3096621767","https://openalex.org/W3101926919","https://openalex.org/W3112469726","https://openalex.org/W3126966255","https://openalex.org/W3134299257","https://openalex.org/W3135497281","https://openalex.org/W3155878512","https://openalex.org/W3165749036","https://openalex.org/W3182743297","https://openalex.org/W3186035148","https://openalex.org/W3193790705","https://openalex.org/W3198729202","https://openalex.org/W3200372272","https://openalex.org/W4237229184","https://openalex.org/W4285719527","https://openalex.org/W4287122174","https://openalex.org/W4287610367","https://openalex.org/W4288363736","https://openalex.org/W4288593469","https://openalex.org/W4300110528","https://openalex.org/W6601977772"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W4393601209","https://openalex.org/W3090906284","https://openalex.org/W253876680","https://openalex.org/W4393803066","https://openalex.org/W1987931999","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770"],"abstract_inverted_index":{"Abstract":[0],"Interactive":[1],"reinforcement":[2,50],"learning":[3,17,51,58],"proposes":[4],"the":[5,16,38,48,57,61,65,69,84,104,126,137,155,161,166],"use":[6,107],"of":[7,40,60,77,113,179],"externally":[8],"sourced":[9],"information":[10],"in":[11,111],"order":[12],"to":[13,55,102,108,125,135,164,177,184],"speed":[14,59],"up":[15],"process.":[18],"When":[19],"interacting":[20],"with":[21],"a":[22,98,141],"learner":[23,127,138],"agent,":[24,62],"humans":[25],"may":[26],"provide":[27,129,145],"either":[28],"evaluative":[29,80,187],"or":[30,81],"informative":[31,123,156],"advice.":[32,188],"Prior":[33],"research":[34],"has":[35,158],"focused":[36],"on":[37,47,68,74],"effect":[39],"human-sourced":[41],"advice":[42,110,124,147,167,176],"by":[43],"including":[44],"real-time":[45],"feedback":[46],"interactive":[49],"process,":[52],"specifically":[53],"aiming":[54],"improve":[56],"while":[63],"minimising":[64],"time":[66],"demands":[67],"human.":[70],"This":[71],"work":[72,92],"focuses":[73],"answering":[75],"which":[76],"two":[78],"approaches,":[79],"informative,":[82],"is":[83,168],"preferred":[85],"instructional":[86],"approach":[87,157],"for":[88,97,140],"humans.":[89],"Moreover,":[90],"this":[91],"presents":[93],"an":[94],"experimental":[95],"setup":[96],"human":[99,114],"trial":[100],"designed":[101],"compare":[103],"methods":[105],"people":[106,185],"deliver":[109],"terms":[112],"engagement.":[115],"The":[116],"results":[117],"obtained":[118],"show":[119],"that":[120,160],"users":[121],"giving":[122],"agents":[128],"more":[130,146],"accurate":[131],"advice,":[132],"are":[133],"willing":[134],"assist":[136],"agent":[139],"longer":[142],"time,":[143],"and":[144,170],"per":[148],"episode.":[149],"Additionally,":[150],"self-evaluation":[151],"from":[152],"participants":[153],"using":[154],"indicated":[159],"agent\u2019s":[162],"ability":[163],"follow":[165],"higher,":[169],"therefore,":[171],"they":[172],"feel":[173],"their":[174],"own":[175],"be":[178],"higher":[180],"accuracy":[181],"when":[182],"compared":[183],"providing":[186]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
