{"id":"https://openalex.org/W2901285216","doi":"https://doi.org/10.1145/3267851.3267898","title":"Investigating the use of recurrent motion modelling for speech gesture generation","display_name":"Investigating the use of recurrent motion modelling for speech gesture generation","publication_year":2018,"publication_date":"2018-11-05","ids":{"openalex":"https://openalex.org/W2901285216","doi":"https://doi.org/10.1145/3267851.3267898","mag":"2901285216"},"language":"en","primary_location":{"id":"doi:10.1145/3267851.3267898","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3267851.3267898","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th International Conference on Intelligent Virtual Agents","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.tara.tcd.ie/bitstream/2262/91094/1/IVA2018b.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035410702","display_name":"Ylva Ferstl","orcid":"https://orcid.org/0000-0001-7259-0378"},"institutions":[{"id":"https://openalex.org/I205274468","display_name":"Trinity College Dublin","ror":"https://ror.org/02tyrky19","country_code":"IE","type":"education","lineage":["https://openalex.org/I205274468"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Ylva Ferstl","raw_affiliation_strings":["Graphics, Vision and Visualisation Group, Trinity College Dublin"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graphics, Vision and Visualisation Group, Trinity College Dublin","institution_ids":["https://openalex.org/I205274468"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079301210","display_name":"Rachel McDonnell","orcid":"https://orcid.org/0000-0002-1957-2506"},"institutions":[{"id":"https://openalex.org/I205274468","display_name":"Trinity College Dublin","ror":"https://ror.org/02tyrky19","country_code":"IE","type":"education","lineage":["https://openalex.org/I205274468"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Rachel McDonnell","raw_affiliation_strings":["Graphics, Vision and Visualisation Group, Trinity College Dublin"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graphics, Vision and Visualisation Group, Trinity College Dublin","institution_ids":["https://openalex.org/I205274468"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5035410702"],"corresponding_institution_ids":["https://openalex.org/I205274468"],"apc_list":null,"apc_paid":null,"fwci":13.2566,"has_fulltext":true,"cited_by_count":137,"citation_normalized_percentile":{"value":0.99042221,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"93","last_page":"98"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.8869713544845581},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8001915812492371},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5862311720848083},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5818521976470947},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.564195990562439},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5088763236999512},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5065230131149292},{"id":"https://openalex.org/keywords/gesture-recognition","display_name":"Gesture recognition","score":0.4453135132789612},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3539189398288727},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3329855501651764},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3279385566711426},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09681946039199829}],"concepts":[{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.8869713544845581},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8001915812492371},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5862311720848083},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5818521976470947},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.564195990562439},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5088763236999512},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5065230131149292},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.4453135132789612},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3539189398288727},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3329855501651764},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3279385566711426},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09681946039199829},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3267851.3267898","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3267851.3267898","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th International Conference on Intelligent Virtual Agents","raw_type":"proceedings-article"},{"id":"pmh:oai:tara.tcd.ie:2262/91094","is_oa":true,"landing_page_url":"http://hdl.handle.net/2262/111444","pdf_url":"https://www.tara.tcd.ie/bitstream/2262/91094/1/IVA2018b.pdf","source":{"id":"https://openalex.org/S4306400387","display_name":"Trinity's Access to Research Output (TARA) (Trinity College Dublin)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205274468","host_organization_name":"Trinity College Dublin","host_organization_lineage":["https://openalex.org/I205274468"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"}],"best_oa_location":{"id":"pmh:oai:tara.tcd.ie:2262/91094","is_oa":true,"landing_page_url":"http://hdl.handle.net/2262/111444","pdf_url":"https://www.tara.tcd.ie/bitstream/2262/91094/1/IVA2018b.pdf","source":{"id":"https://openalex.org/S4306400387","display_name":"Trinity's Access to Research Output (TARA) (Trinity College Dublin)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205274468","host_organization_name":"Trinity College Dublin","host_organization_lineage":["https://openalex.org/I205274468"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5899999737739563,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G2693890202","display_name":null,"funder_award_id":"13/RC/2016","funder_id":"https://openalex.org/F4320320847","funder_display_name":"Science Foundation Ireland"}],"funders":[{"id":"https://openalex.org/F4320320847","display_name":"Science Foundation Ireland","ror":"https://ror.org/0271asj38"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2901285216.pdf","grobid_xml":"https://content.openalex.org/works/W2901285216.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W114912394","https://openalex.org/W179875071","https://openalex.org/W1208039178","https://openalex.org/W1534876773","https://openalex.org/W1546103008","https://openalex.org/W1969681536","https://openalex.org/W1974604838","https://openalex.org/W1984037038","https://openalex.org/W1984541135","https://openalex.org/W2022214202","https://openalex.org/W2024536104","https://openalex.org/W2035046981","https://openalex.org/W2065338371","https://openalex.org/W2077206503","https://openalex.org/W2090777335","https://openalex.org/W2109636054","https://openalex.org/W2111902182","https://openalex.org/W2112604602","https://openalex.org/W2115825178","https://openalex.org/W2118163921","https://openalex.org/W2122376170","https://openalex.org/W2131734538","https://openalex.org/W2135966470","https://openalex.org/W2141125555","https://openalex.org/W2142487393","https://openalex.org/W2235920218","https://openalex.org/W2250644439","https://openalex.org/W2253728219","https://openalex.org/W2296371640","https://openalex.org/W2530983305","https://openalex.org/W2747610795","https://openalex.org/W2764552839","https://openalex.org/W2766709201","https://openalex.org/W2800691917","https://openalex.org/W2913756371","https://openalex.org/W2949888546","https://openalex.org/W2951188428","https://openalex.org/W2963165299","https://openalex.org/W2964203186","https://openalex.org/W4299390018"],"related_works":["https://openalex.org/W2066003895","https://openalex.org/W2902873204","https://openalex.org/W2185750513","https://openalex.org/W4312416068","https://openalex.org/W3147379364","https://openalex.org/W2010878661","https://openalex.org/W2026258298","https://openalex.org/W3204639664","https://openalex.org/W2970836791","https://openalex.org/W2805039731"],"abstract_inverted_index":{"The":[0],"growing":[1],"use":[2,83,102],"of":[3,39,51,57,72,84,121,139,145],"virtual":[4,27],"humans":[5],"demands":[6],"generating":[7],"increasingly":[8],"realistic":[9,24],"behavior":[10],"for":[11,23,96,142],"them":[12],"while":[13],"minimizing":[14],"cost":[15],"and":[16,25,29,54,116],"time.":[17],"Gestures":[18],"are":[19],"a":[20,36,69,103,118,129,135],"key":[21],"ingredient":[22],"engaging":[26],"agents":[28],"consequently":[30],"automatized":[31],"gesture":[32,44,97,122],"generation":[33,45,98],"has":[34,46],"been":[35],"popular":[37],"area":[38],"research.":[40],"So":[41],"far,":[42],"good":[43],"relied":[47],"on":[48],"explicit":[49],"formulation":[50],"if-then":[52],"rules":[53],"probabilistic":[55],"modelling":[56,90,131],"annotated":[58],"features.":[59],"Machine":[60],"learning":[61,75,86,94],"approaches":[62],"have":[63],"yielded":[64],"only":[65],"marginal":[66],"success,":[67],"indicating":[68],"high":[70],"complexity":[71],"the":[73,82,126,143],"speech-to-motion":[74],"task.":[76,132],"In":[77],"this":[78,146],"work,":[79],"we":[80],"explore":[81],"transfer":[85],"using":[87],"previous":[88],"motion":[89,130],"research":[91],"to":[92],"improve":[93],"outcomes":[95],"from":[99],"speech.":[100],"We":[101,124,133],"recurrent":[104],"network":[105,127],"with":[106,128],"an":[107],"encoder-decoder":[108],"structure":[109],"that":[110],"takes":[111],"in":[112],"prosodic":[113],"speech":[114,141],"features":[115],"generates":[117],"short":[119],"sequence":[120],"motion.":[123],"pre-train":[125],"recorded":[134],"large":[136],"multimodal":[137],"database":[138],"conversational":[140],"purpose":[144],"work.":[147]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":26},{"year":2023,"cited_by_count":25},{"year":2022,"cited_by_count":17},{"year":2021,"cited_by_count":28},{"year":2020,"cited_by_count":14},{"year":2019,"cited_by_count":5}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2018-11-29T00:00:00"}
