{"id":"https://openalex.org/W4403913099","doi":"https://doi.org/10.1145/3678957.3685742","title":"Online Multimodal End-of-Turn Prediction for Three-party Conversations","display_name":"Online Multimodal End-of-Turn Prediction for Three-party Conversations","publication_year":2024,"publication_date":"2024-10-30","ids":{"openalex":"https://openalex.org/W4403913099","doi":"https://doi.org/10.1145/3678957.3685742"},"language":"en","primary_location":{"id":"doi:10.1145/3678957.3685742","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3678957.3685742","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conference on Multimodel Interaction","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005674450","display_name":"Meng-Chen Lee","orcid":"https://orcid.org/0009-0002-9726-1153"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Meng-Chen Lee","raw_affiliation_strings":["Department of Computer Science, University of Houston, United States"],"raw_orcid":"https://orcid.org/0009-0002-9726-1153","affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Houston, United States","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026683388","display_name":"Zhigang Deng","orcid":"https://orcid.org/0000-0002-0452-8676"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhigang Deng","raw_affiliation_strings":["Department of Computer Science, University of Houston, United States"],"raw_orcid":"https://orcid.org/0000-0002-0452-8676","affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Houston, United States","institution_ids":["https://openalex.org/I44461941"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5005674450"],"corresponding_institution_ids":["https://openalex.org/I44461941"],"apc_list":null,"apc_paid":null,"fwci":1.9868,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.88703388,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"57","last_page":"65"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/turn-taking","display_name":"Turn-taking","score":0.7452935576438904},{"id":"https://openalex.org/keywords/turn","display_name":"Turn (biochemistry)","score":0.6484887599945068},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6378491520881653},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3242063820362091},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.2922716736793518},{"id":"https://openalex.org/keywords/communication","display_name":"Communication","score":0.13310042023658752},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.09285929799079895},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.06765958666801453}],"concepts":[{"id":"https://openalex.org/C2776352735","wikidata":"https://www.wikidata.org/wiki/Q2313343","display_name":"Turn-taking","level":3,"score":0.7452935576438904},{"id":"https://openalex.org/C85641259","wikidata":"https://www.wikidata.org/wiki/Q290042","display_name":"Turn (biochemistry)","level":2,"score":0.6484887599945068},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6378491520881653},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3242063820362091},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.2922716736793518},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.13310042023658752},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.09285929799079895},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.06765958666801453},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3678957.3685742","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3678957.3685742","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conference on Multimodel Interaction","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1161474730","https://openalex.org/W1526675628","https://openalex.org/W1533504578","https://openalex.org/W1583748115","https://openalex.org/W1981611667","https://openalex.org/W2002069029","https://openalex.org/W2008741806","https://openalex.org/W2087762538","https://openalex.org/W2100356893","https://openalex.org/W2116985048","https://openalex.org/W2129090275","https://openalex.org/W2139659117","https://openalex.org/W2141666434","https://openalex.org/W2154524549","https://openalex.org/W2161782031","https://openalex.org/W2260472133","https://openalex.org/W2293392332","https://openalex.org/W2401047175","https://openalex.org/W2591348521","https://openalex.org/W2610786808","https://openalex.org/W2786387151","https://openalex.org/W2888997666","https://openalex.org/W2889445100","https://openalex.org/W2921495256","https://openalex.org/W2944069152","https://openalex.org/W2965465515","https://openalex.org/W2980823180","https://openalex.org/W3104405162","https://openalex.org/W3112188842","https://openalex.org/W3143450176","https://openalex.org/W4224308101","https://openalex.org/W4283268092","https://openalex.org/W4312372834","https://openalex.org/W4387421683","https://openalex.org/W4405812764","https://openalex.org/W6778883912","https://openalex.org/W6810081322"],"related_works":["https://openalex.org/W2900127165","https://openalex.org/W320957374","https://openalex.org/W2379107843","https://openalex.org/W3120641923","https://openalex.org/W2909654650","https://openalex.org/W3161619631","https://openalex.org/W4242512034","https://openalex.org/W3003178987","https://openalex.org/W4400912116","https://openalex.org/W4376475259"],"abstract_inverted_index":{"Predicting":[0],"end-of-turn":[1,32,70,119],"in":[2,34,36,72,107,130],"multiparty":[3,37],"conversations":[4],"is":[5],"crucial":[6],"to":[7,21,30,67,125],"increase":[8],"the":[9,41,57,90,108,127],"usability":[10],"and":[11,49,94,113,137],"natural":[12,136],"flow":[13],"of":[14,43,92,101,110],"spoken":[15],"dialogue":[16],"systems,":[17],"offering":[18],"substantial":[19],"enhancements":[20],"conversational":[22],"agents.":[23],"We":[24],"present":[25],"a":[26,62],"novel":[27],"window-based":[28],"method":[29,55],"predict":[31,69],"moments":[33],"real-time":[35],"conversations,":[38],"by":[39],"leveraging":[40],"capabilities":[42],"cutting-edge":[44],"pre-trained":[45],"language":[46,59],"models":[47],"(PLMs)":[48],"recurrent":[50],"neural":[51],"networks":[52],"(RNN).":[53],"Our":[54,76,116],"fuses":[56],"distilBERT":[58],"model":[60,121],"with":[61],"Gated":[63],"Recurrent":[64],"Unit":[65,83],"(GRU)":[66],"accurately":[68],"points":[71],"an":[73],"online":[74,118],"fashion.":[75],"approach":[77],"can":[78,122],"significantly":[79],"outperform":[80],"conventional":[81],"Inter-Pausal":[82],"(IPU)-based":[84],"prediction":[85,120],"methods":[86],"that":[87],"often":[88],"overlook":[89],"nuances":[91],"overlap":[93],"interruption":[95],"during":[96],"dynamic":[97],"conversations.":[98,142],"Potential":[99],"applications":[100],"this":[102],"study":[103],"are":[104],"significant,":[105],"particularly":[106],"domains":[109],"virtual":[111],"agents":[112],"human-robot":[114],"interactions.":[115],"accurate":[117],"be":[123],"facilitated":[124],"enhance":[126],"user":[128],"experience":[129],"these":[131],"applications,":[132],"making":[133],"them":[134],"more":[135],"seamlessly":[138],"integrated":[139],"into":[140],"real-world":[141]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
