{"id":"https://openalex.org/W7139937265","doi":"https://doi.org/10.48550/arxiv.2603.18758","title":"Dual-Model Prediction of Affective Engagement and Vocal Attractiveness from Speaker Expressiveness in Video Learning","display_name":"Dual-Model Prediction of Affective Engagement and Vocal Attractiveness from Speaker Expressiveness in Video Learning","publication_year":2026,"publication_date":"2026-03-19","ids":{"openalex":"https://openalex.org/W7139937265","doi":"https://doi.org/10.48550/arxiv.2603.18758"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.18758","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18758","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.18758","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036002469","display_name":"Hung-Yue Suen","orcid":"https://orcid.org/0000-0002-6796-2031"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Suen, Hung-Yue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074186083","display_name":"Kuo-En Hung","orcid":"https://orcid.org/0000-0003-2091-2747"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hung, Kuo-En","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5000917818","display_name":"Fan\u2010Hsun Tseng","orcid":"https://orcid.org/0000-0003-2461-8377"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tseng, Fan-Hsun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9229000210762024,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9229000210762024,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.01140000019222498,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.005499999970197678,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/attractiveness","display_name":"Attractiveness","score":0.664900004863739},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5846999883651733},{"id":"https://openalex.org/keywords/affective-computing","display_name":"Affective computing","score":0.5009999871253967},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.4661000072956085},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.460999995470047},{"id":"https://openalex.org/keywords/affect","display_name":"Affect (linguistics)","score":0.4494999945163727},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.4456000030040741},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.44200000166893005}],"concepts":[{"id":"https://openalex.org/C31173074","wikidata":"https://www.wikidata.org/wiki/Q2632514","display_name":"Attractiveness","level":2,"score":0.664900004863739},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.618399977684021},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5846999883651733},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.5009999871253967},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.4661000072956085},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.460999995470047},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.459199994802475},{"id":"https://openalex.org/C2776035688","wikidata":"https://www.wikidata.org/wiki/Q1606558","display_name":"Affect (linguistics)","level":2,"score":0.4494999945163727},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.4456000030040741},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.44200000166893005},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.4406999945640564},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43160000443458557},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.4099999964237213},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.3953000009059906},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3506999909877777},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3449000120162964},{"id":"https://openalex.org/C2777375102","wikidata":"https://www.wikidata.org/wiki/Q208351","display_name":"Disgust","level":3,"score":0.3353999853134155},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.328000009059906},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.3127000033855438},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.31119999289512634},{"id":"https://openalex.org/C143110190","wikidata":"https://www.wikidata.org/wiki/Q5373787","display_name":"Emotional expression","level":2,"score":0.2946999967098236},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.26969999074935913},{"id":"https://openalex.org/C2781168091","wikidata":"https://www.wikidata.org/wiki/Q1059883","display_name":"Audience response","level":2,"score":0.25429999828338623}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.18758","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18758","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.18758","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18758","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0,138],"paper":[1,139],"outlines":[2],"a":[3,50,89,141],"machine":[4],"learning-enabled":[5],"speaker-centric":[6,39,142],"Emotion":[7,40,143],"AI":[8,41,144],"approach":[9,42,145],"capable":[10],"of":[11],"predicting":[12,68],"audience-affective":[13],"engagement":[14,70,120],"and":[15,84,121],"vocal":[16,95,126],"attractiveness":[17,96],"in":[18],"asynchronous":[19],"video-based":[20],"learning,":[21],"relying":[22],"solely":[23],"on":[24,99,104],"speaker-side":[25,100,130,153],"affective":[26,35,69,119],"expressions.":[27],"Inspired":[28],"by":[29,73,147],"the":[30],"demand":[31],"for":[32,118,125],"scalable,":[33],"privacy-preserving":[34],"computing":[36],"applications,":[37],"this":[38],"incorporates":[43],"two":[44],"distinct":[45],"regression":[46,66,91,109],"models":[47,110],"that":[48,129,152],"leverage":[49],"massive":[51],"corpus":[52],"developed":[53,72],"within":[54],"Massive":[55],"Open":[56],"Online":[57],"Courses":[58],"(MOOCs)":[59],"to":[60,93],"enable":[61],"affectively":[62],"engaging":[63],"experiences.":[64],"The":[65],"model":[67,92],"is":[71],"assimilating":[74],"emotional":[75],"expressions":[76],"emanating":[77],"from":[78],"facial":[79],"dynamics,":[80],"oculomotor":[81],"features,":[82,155],"prosody,":[83],"cognitive":[85],"semantics,":[86],"while":[87],"incorporating":[88],"second":[90],"predict":[94],"based":[97],"exclusively":[98],"acoustic":[101],"features.":[102],"Notably,":[103],"speaker-independent":[105],"test":[106],"sets,":[107],"both":[108],"yielded":[111],"impressive":[112],"predictive":[113],"performance":[114],"(R2":[115],"=":[116,123],"0.85":[117],"R2":[122],"0.88":[124],"attractiveness),":[127],"confirming":[128],"affect":[131],"can":[132,158],"functionally":[133],"represent":[134],"aggregated":[135],"audience":[136,161],"feedback.":[137],"provides":[140],"substantiated":[146],"an":[148],"empirical":[149],"study":[150],"discovering":[151],"multimodal":[154],"including":[156],"acoustics,":[157],"prospectively":[159],"forecast":[160],"feedback":[162],"without":[163],"necessarily":[164],"employing":[165],"audience-side":[166],"input":[167],"information.":[168]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-21T00:00:00"}
