{"id":"https://openalex.org/W2965797071","doi":"https://doi.org/10.1109/acii.2019.8925443","title":"Batch Recurrent Q-Learning for Backchannel Generation Towards Engaging Agents","display_name":"Batch Recurrent Q-Learning for Backchannel Generation Towards Engaging Agents","publication_year":2019,"publication_date":"2019-09-01","ids":{"openalex":"https://openalex.org/W2965797071","doi":"https://doi.org/10.1109/acii.2019.8925443","mag":"2965797071"},"language":"en","primary_location":{"id":"doi:10.1109/acii.2019.8925443","is_oa":false,"landing_page_url":"https://doi.org/10.1109/acii.2019.8925443","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 8th International Conference on Affective Computing and Intelligent Interaction (ACII)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1908.02037","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073627972","display_name":"Nusrah Hussain","orcid":"https://orcid.org/0000-0001-8786-1871"},"institutions":[{"id":"https://openalex.org/I1351752","display_name":"Ko\u00e7 University","ror":"https://ror.org/00jzwgz36","country_code":"TR","type":"education","lineage":["https://openalex.org/I1351752"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Nusrah Hussain","raw_affiliation_strings":["College of Engineering, Ko\u00e7 University, Istanbul, Turkey","College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#"],"affiliations":[{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I1351752"]},{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#","institution_ids":["https://openalex.org/I1351752"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064993025","display_name":"Engin Erzin","orcid":"https://orcid.org/0000-0002-2715-2368"},"institutions":[{"id":"https://openalex.org/I1351752","display_name":"Ko\u00e7 University","ror":"https://ror.org/00jzwgz36","country_code":"TR","type":"education","lineage":["https://openalex.org/I1351752"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Engin Erzin","raw_affiliation_strings":["College of Engineering, Ko\u00e7 University, Istanbul, Turkey","College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#"],"affiliations":[{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I1351752"]},{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#","institution_ids":["https://openalex.org/I1351752"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005565161","display_name":"Tevfik Metin Sezgin","orcid":"https://orcid.org/0000-0002-1524-1646"},"institutions":[{"id":"https://openalex.org/I1351752","display_name":"Ko\u00e7 University","ror":"https://ror.org/00jzwgz36","country_code":"TR","type":"education","lineage":["https://openalex.org/I1351752"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"T. Metin Sezgin","raw_affiliation_strings":["College of Engineering, Ko\u00e7 University, Istanbul, Turkey","College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#"],"affiliations":[{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I1351752"]},{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#","institution_ids":["https://openalex.org/I1351752"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074744284","display_name":"Y. Yemez","orcid":"https://orcid.org/0000-0002-7515-3138"},"institutions":[{"id":"https://openalex.org/I1351752","display_name":"Ko\u00e7 University","ror":"https://ror.org/00jzwgz36","country_code":"TR","type":"education","lineage":["https://openalex.org/I1351752"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Yucel Yemez","raw_affiliation_strings":["College of Engineering, Ko\u00e7 University, Istanbul, Turkey","College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#"],"affiliations":[{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey","institution_ids":["https://openalex.org/I1351752"]},{"raw_affiliation_string":"College of Engineering, Ko\u00e7 University, Istanbul, Turkey#TAB#","institution_ids":["https://openalex.org/I1351752"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5073627972"],"corresponding_institution_ids":["https://openalex.org/I1351752"],"apc_list":null,"apc_paid":null,"fwci":0.2698,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.64362717,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"135","issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11795","display_name":"Humor Studies and Applications","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11795","display_name":"Humor Studies and Applications","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.9839000105857849,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8643884658813477},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7024909853935242},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.640425443649292},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5051115155220032},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.48596107959747314},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.45911329984664917},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.45483797788619995},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4519963562488556},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.44172850251197815},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4012957215309143},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.19857728481292725},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08887124061584473}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8643884658813477},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7024909853935242},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.640425443649292},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5051115155220032},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.48596107959747314},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.45911329984664917},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.45483797788619995},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4519963562488556},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.44172850251197815},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4012957215309143},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.19857728481292725},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08887124061584473},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/acii.2019.8925443","is_oa":false,"landing_page_url":"https://doi.org/10.1109/acii.2019.8925443","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 8th International Conference on Affective Computing and Intelligent Interaction (ACII)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1908.02037","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1908.02037","pdf_url":"https://arxiv.org/pdf/1908.02037","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2965797071","is_oa":true,"landing_page_url":"https://arxiv.org/abs/1908.02037","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1908.02037","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1908.02037","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1908.02037","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1908.02037","pdf_url":"https://arxiv.org/pdf/1908.02037","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2965797071.pdf","grobid_xml":"https://content.openalex.org/works/W2965797071.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W192920577","https://openalex.org/W837827503","https://openalex.org/W1515851193","https://openalex.org/W1646707810","https://openalex.org/W1925043605","https://openalex.org/W1974219072","https://openalex.org/W1980763452","https://openalex.org/W2019934316","https://openalex.org/W2063643001","https://openalex.org/W2070629246","https://openalex.org/W2092287437","https://openalex.org/W2094240310","https://openalex.org/W2094856020","https://openalex.org/W2120346334","https://openalex.org/W2140996653","https://openalex.org/W2145339207","https://openalex.org/W2146334809","https://openalex.org/W2147272821","https://openalex.org/W2187036766","https://openalex.org/W2291168657","https://openalex.org/W2471193380","https://openalex.org/W2530983305","https://openalex.org/W2570651606","https://openalex.org/W2594693247","https://openalex.org/W2747602812","https://openalex.org/W2769428625","https://openalex.org/W2810033056","https://openalex.org/W2962938178","https://openalex.org/W3101568187","https://openalex.org/W3143996792","https://openalex.org/W4246277771","https://openalex.org/W6603745846","https://openalex.org/W6606719070","https://openalex.org/W6658084583","https://openalex.org/W6677737365","https://openalex.org/W6677939520","https://openalex.org/W6691215711","https://openalex.org/W6694521564","https://openalex.org/W6696555554","https://openalex.org/W6704084210","https://openalex.org/W6746563764"],"related_works":["https://openalex.org/W2965916794","https://openalex.org/W2964263543","https://openalex.org/W3167658443","https://openalex.org/W3092995464","https://openalex.org/W3039601517","https://openalex.org/W3027086341","https://openalex.org/W3093430376","https://openalex.org/W2945719686","https://openalex.org/W2604299654","https://openalex.org/W2183893812","https://openalex.org/W2754794180","https://openalex.org/W2158150115","https://openalex.org/W2911607485","https://openalex.org/W3205271037","https://openalex.org/W2550648340","https://openalex.org/W3168250321","https://openalex.org/W2535652371","https://openalex.org/W2973940173","https://openalex.org/W2169106844","https://openalex.org/W2344013593"],"abstract_inverted_index":{"The":[0,100],"ability":[1],"to":[2,166],"generate":[3],"appropriate":[4],"verbal":[5],"and":[6,28,34,80,90,121],"nonverbal":[7],"backchannels":[8],"by":[9,72,109],"an":[10,123,171],"agent":[11,124,172],"during":[12,51],"human-robot":[13,53],"interaction":[14,18,54,73],"greatly":[15],"enhances":[16],"the":[17,37,56,62,86,132,138,147,161],"experience.":[19],"Backchannels":[20],"are":[21,164],"particularly":[22],"important":[23],"in":[24,137,149],"applications":[25],"like":[26],"tutoring":[27],"counseling,":[29],"which":[30],"require":[31],"constant":[32],"attention":[33],"engagement":[35,67,169],"of":[36,64,85,134],"user.":[38],"We":[39,113],"present":[40],"here":[41],"a":[42,46,52,75,95,105,119],"method":[43],"for":[44,48,142],"training":[45],"robot":[47],"backchannel":[49,120],"generation":[50],"within":[55],"reinforcement":[57,97],"learning":[58,71,98],"(RL)":[59],"framework,":[60],"with":[61,74,116,125],"goal":[63],"maintaining":[65],"high":[66],"level.":[68],"Since":[69],"online":[70],"human":[76],"is":[77,102,158],"highly":[78],"time-consuming":[79],"impractical,":[81],"we":[82,130],"take":[83],"advantage":[84],"recorded":[87],"human-to-human":[88],"dataset":[89,101],"approach":[91],"our":[92],"problem":[93],"as":[94,104,118],"batch":[96,106],"problem.":[99],"utilized":[103],"data":[107],"acquired":[108],"some":[110],"behavior":[111],"policy.":[112],"perform":[114],"experiments":[115],"laughs":[117],"train":[122],"value-based":[126],"techniques.":[127],"In":[128],"particular,":[129],"demonstrate":[131],"effectiveness":[133],"recurrent":[135],"layers":[136],"approximate":[139],"value":[140],"function":[141],"this":[143],"problem,":[144],"that":[145,160],"boosts":[146],"performance":[148],"partially":[150],"observable":[151],"environments.":[152],"With":[153],"off-policy":[154],"policy":[155],"evaluation,":[156],"it":[157],"shown":[159],"RL":[162],"agents":[163],"expected":[165],"produce":[167],"more":[168],"than":[170],"trained":[173],"from":[174],"imitation":[175],"learning.":[176]},"counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
