{"id":"https://openalex.org/W4406123789","doi":"https://doi.org/10.48550/arxiv.2501.03190","title":"Multimodal Machine Learning Can Predict Videoconference Fluidity and Enjoyment","display_name":"Multimodal Machine Learning Can Predict Videoconference Fluidity and Enjoyment","publication_year":2025,"publication_date":"2025-01-06","ids":{"openalex":"https://openalex.org/W4406123789","doi":"https://doi.org/10.48550/arxiv.2501.03190"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2501.03190","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.03190","pdf_url":"https://arxiv.org/pdf/2501.03190","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.03190","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102881477","display_name":"Andrew Chang","orcid":"https://orcid.org/0009-0003-1441-1310"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chang, Andrew","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115792754","display_name":"Viswadruth Akkaraju","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akkaraju, Viswadruth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115792755","display_name":"Ray McFadden Cogliano","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cogliano, Ray McFadden","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033417964","display_name":"David Poeppel","orcid":"https://orcid.org/0000-0003-0184-163X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Poeppel, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5035737956","display_name":"Dustin Freeman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Freeman, Dustin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102881477"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9571999907493591,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9571999907493591,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/videoconferencing","display_name":"Videoconferencing","score":0.577660322189331},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.48865702748298645},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.39687713980674744},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3425073027610779},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3207392394542694}],"concepts":[{"id":"https://openalex.org/C22561748","wikidata":"https://www.wikidata.org/wiki/Q854954","display_name":"Videoconferencing","level":2,"score":0.577660322189331},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.48865702748298645},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.39687713980674744},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3425073027610779},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3207392394542694}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2501.03190","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.03190","pdf_url":"https://arxiv.org/pdf/2501.03190","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2501.03190","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2501.03190","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.03190","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.03190","pdf_url":"https://arxiv.org/pdf/2501.03190","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7279642215","display_name":null,"funder_award_id":"F32DC018205","funder_id":"https://openalex.org/F4320337352","funder_display_name":"National Institute on Deafness and Other Communication Disorders"}],"funders":[{"id":"https://openalex.org/F4320309445","display_name":"Leon Levy Foundation","ror":"https://ror.org/033hnyq61"},{"id":"https://openalex.org/F4320319918","display_name":"York University","ror":"https://ror.org/05fq50484"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"},{"id":"https://openalex.org/F4320337352","display_name":"National Institute on Deafness and Other Communication Disorders","ror":"https://ror.org/04mhx6838"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4406123789.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2142127558","https://openalex.org/W1546632383","https://openalex.org/W4313257994","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W2309250577"],"abstract_inverted_index":{"Videoconferencing":[0],"is":[1,114],"now":[2],"a":[3,115],"frequent":[4],"mode":[5],"of":[6,22,34,42,82,136],"communication":[7],"in":[8,37],"both":[9],"professional":[10],"and":[11,20,54,68],"informal":[12],"settings,":[13],"yet":[14],"it":[15],"often":[16],"lacks":[17],"the":[18,46],"fluidity":[19],"enjoyment":[21],"in-person":[23],"conversation.":[24],"This":[25,97],"study":[26,142],"leverages":[27],"multimodal":[28,101,126],"machine":[29,127],"learning":[30,128],"to":[31,58,84,117,132],"predict":[32,106],"moments":[33,135],"negative":[35,137],"experience":[36,122,139],"videoconferencing.":[38],"We":[39],"sampled":[40],"thousands":[41],"short":[43],"clips":[44],"from":[45],"RoomReader":[47],"corpus,":[48],"extracting":[49],"audio":[50,92],"embeddings,":[51],"facial":[52],"actions,":[53],"body":[55],"motion":[56],"features":[57,93],"train":[59],"models":[60,78],"for":[61,140],"identifying":[62],"low":[63,66],"conversational":[64,70,109],"fluidity,":[65],"enjoyment,":[67],"classifying":[69],"events":[71],"(backchanneling,":[72],"interruption,":[73],"or":[74,143],"gap).":[75],"Our":[76],"best":[77],"achieved":[79],"an":[80],"ROC-AUC":[81],"up":[83],"0.87":[85],"on":[86,119],"hold-out":[87],"videoconference":[88],"sessions,":[89],"with":[90],"domain-general":[91],"proving":[94],"most":[95],"critical.":[96],"work":[98],"demonstrates":[99],"that":[100,125],"audio-video":[102],"signals":[103],"can":[104,129],"effectively":[105],"high-level":[107],"subjective":[108],"outcomes.":[110],"In":[111],"addition,":[112],"this":[113],"contribution":[116],"research":[118],"videoconferencing":[120],"user":[121,138],"by":[123],"showing":[124],"be":[130],"used":[131],"identify":[133],"rare":[134],"further":[141],"mitigation.":[144]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
